• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #4872

04 Dec 2025 01:55AM UTC coverage: 64.678% (+0.02%) from 64.654%
#4872

push

travis-ci

guanshengliang
Merge branch '3.0' into cover/3.0

880 of 2219 new or added lines in 36 files covered. (39.66%)

6146 existing lines in 122 files now uncovered.

159679 of 246882 relevant lines covered (64.68%)

110947965.82 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

66.9
/source/dnode/mnode/impl/src/mndVgroup.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
#include "audit.h"
18
#include "mndArbGroup.h"
19
#include "mndDb.h"
20
#include "mndDnode.h"
21
#include "mndMnode.h"
22
#include "mndPrivilege.h"
23
#include "mndShow.h"
24
#include "mndStb.h"
25
#include "mndStream.h"
26
#include "mndTopic.h"
27
#include "mndTrans.h"
28
#include "mndUser.h"
29
#include "mndVgroup.h"
30
#include "tmisce.h"
31

32
#define VGROUP_VER_NUMBER   1
33
#define VGROUP_RESERVE_SIZE 60
34

35
static int32_t mndVgroupActionInsert(SSdb *pSdb, SVgObj *pVgroup);
36
static int32_t mndVgroupActionDelete(SSdb *pSdb, SVgObj *pVgroup);
37
static int32_t mndVgroupActionUpdate(SSdb *pSdb, SVgObj *pOld, SVgObj *pNew);
38
static int32_t mndNewVgActionValidate(SMnode *pMnode, STrans *pTrans, SSdbRaw *pRaw);
39

40
static int32_t mndRetrieveVgroups(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
41
static void    mndCancelGetNextVgroup(SMnode *pMnode, void *pIter);
42
static int32_t mndRetrieveVnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
43
static void    mndCancelGetNextVnode(SMnode *pMnode, void *pIter);
44

45
static int32_t mndProcessRedistributeVgroupMsg(SRpcMsg *pReq);
46
static int32_t mndProcessSplitVgroupMsg(SRpcMsg *pReq);
47
static int32_t mndProcessBalanceVgroupMsg(SRpcMsg *pReq);
48
static int32_t mndProcessVgroupBalanceLeaderMsg(SRpcMsg *pReq);
49
static int32_t mndProcessSetVgroupKeepVersionReq(SRpcMsg *pReq);
50

51
// Registers everything the vgroup module owns on this mnode: the response
// messages that are forwarded to the transaction engine, the vgroup request
// handlers, the show-table retrieve/free-iterator hooks, and finally the
// SDB_VGROUP table itself. Returns whatever sdbSetTable() returns.
int32_t mndInitVgroup(SMnode *pMnode) {
  // Every response type below is handled by mndTransProcessRsp.
  const int32_t transRspMsgs[] = {
      TDMT_DND_CREATE_VNODE_RSP,
      TDMT_VND_ALTER_REPLICA_RSP,
      TDMT_VND_ALTER_CONFIG_RSP,
      TDMT_VND_ALTER_CONFIRM_RSP,
      TDMT_VND_SET_KEEP_VERSION_RSP,
      TDMT_VND_ALTER_HASHRANGE_RSP,
      TDMT_DND_DROP_VNODE_RSP,
      TDMT_VND_COMPACT_RSP,
      TDMT_VND_SCAN_RSP,
      TDMT_VND_DISABLE_WRITE_RSP,
      TDMT_SYNC_FORCE_FOLLOWER_RSP,
      TDMT_VND_ALTER_ELECTBASELINE_RSP,
      TDMT_DND_ALTER_VNODE_TYPE_RSP,
      TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP_RSP,
      TDMT_SYNC_CONFIG_CHANGE_RSP,
  };
  const int32_t numOfTransRspMsgs = (int32_t)(sizeof(transRspMsgs) / sizeof(transRspMsgs[0]));
  for (int32_t m = 0; m < numOfTransRspMsgs; ++m) {
    mndSetMsgHandle(pMnode, transRspMsgs[m], mndTransProcessRsp);
  }

  // Requests processed by this module.
  mndSetMsgHandle(pMnode, TDMT_MND_REDISTRIBUTE_VGROUP, mndProcessRedistributeVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_SPLIT_VGROUP, mndProcessSplitVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_BALANCE_VGROUP, mndProcessBalanceVgroupMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_BALANCE_VGROUP_LEADER, mndProcessVgroupBalanceLeaderMsg);
  mndSetMsgHandle(pMnode, TDMT_MND_SET_VGROUP_KEEP_VERSION, mndProcessSetVgroupKeepVersionReq);

  // Show-table hooks for vgroups and vnodes.
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_VGROUP, mndRetrieveVgroups);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_VGROUP, mndCancelGetNextVgroup);
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_VNODES, mndRetrieveVnodes);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_VNODES, mndCancelGetNextVnode);

  // SDB table descriptor: int32 key plus the encode/decode/insert/update/delete/validate hooks.
  SSdbTable vgroupTable = {0};
  vgroupTable.sdbType = SDB_VGROUP;
  vgroupTable.keyType = SDB_KEY_INT32;
  vgroupTable.encodeFp = (SdbEncodeFp)mndVgroupActionEncode;
  vgroupTable.decodeFp = (SdbDecodeFp)mndVgroupActionDecode;
  vgroupTable.insertFp = (SdbInsertFp)mndVgroupActionInsert;
  vgroupTable.updateFp = (SdbUpdateFp)mndVgroupActionUpdate;
  vgroupTable.deleteFp = (SdbDeleteFp)mndVgroupActionDelete;
  vgroupTable.validateFp = (SdbValidateFp)mndNewVgActionValidate;

  return sdbSetTable(pMnode->pSdb, vgroupTable);
}
94

95
// Counterpart of mndInitVgroup(); this function has an empty body.
void mndCleanupVgroup(SMnode *pMnode) {
  (void)pMnode;
}
488,059✔
96

97
// Serializes a vgroup object into a newly allocated SDB raw record.
//
// Field order written: vgId, createdTime, updateTime, version, hashBegin,
// hashEnd, dbName, dbUid, isTsma, replica, one dnodeId per replica,
// syncConfChangeVer, mountVgId, keepVersion, keepVersionTime, reserve area.
//
// Returns the raw record on success. On failure logs the error, frees the
// record and returns NULL with terrno left non-zero.
SSdbRaw *mndVgroupActionEncode(SVgObj *pVgroup) {
  // code/lino are kept in scope for the SDB_SET_* macros (NOTE(review): confirm the macros still use them).
  int32_t  code = 0;
  int32_t  lino = 0;
  int32_t  dataPos = 0;
  SSdbRaw *pRaw = NULL;

  // Pessimistic default; cleared only once every field has been written.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  pRaw = sdbAllocRaw(SDB_VGROUP, VGROUP_VER_NUMBER, sizeof(SVgObj) + VGROUP_RESERVE_SIZE);
  if (pRaw == NULL) goto _OVER;

  SDB_SET_INT32(pRaw, dataPos, pVgroup->vgId, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->createdTime, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->updateTime, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->version, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->hashBegin, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->hashEnd, _OVER)
  SDB_SET_BINARY(pRaw, dataPos, pVgroup->dbName, TSDB_DB_FNAME_LEN, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->dbUid, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pVgroup->isTsma, _OVER)
  SDB_SET_INT8(pRaw, dataPos, pVgroup->replica, _OVER)

  // Only the dnode id of each member is persisted.
  for (int8_t r = 0; r < pVgroup->replica; ++r) {
    SDB_SET_INT32(pRaw, dataPos, pVgroup->vnodeGid[r].dnodeId, _OVER)
  }

  SDB_SET_INT32(pRaw, dataPos, pVgroup->syncConfChangeVer, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pVgroup->mountVgId, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->keepVersion, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pVgroup->keepVersionTime, _OVER)
  SDB_SET_RESERVE(pRaw, dataPos, VGROUP_RESERVE_SIZE, _OVER)
  SDB_SET_DATALEN(pRaw, dataPos, _OVER)

  terrno = 0;

_OVER:
  if (terrno == 0) {
    mTrace("vgId:%d, encode to raw:%p, row:%p", pVgroup->vgId, pRaw, pVgroup);
    return pRaw;
  }

  mError("vgId:%d, failed to encode to raw:%p since %s", pVgroup->vgId, pRaw, terrstr());
  sdbFreeRaw(pRaw);
  return NULL;
}
139

140
// Rebuilds a vgroup row from an SDB raw record.
//
// Only soft version 1..VGROUP_VER_NUMBER is accepted. The trailing fields
// (syncConfChangeVer, keepVersion, keepVersionTime) are read only when the
// record is long enough to contain them in front of the reserve area, so
// shorter records written without those fields still decode.
//
// Returns the new row on success. On failure logs the error, frees the row
// and returns NULL with terrno left non-zero.
SSdbRow *mndVgroupActionDecode(SSdbRaw *pRaw) {
  // code/lino are kept in scope for the SDB_GET_* macros (NOTE(review): confirm the macros still use them).
  int32_t code = 0;
  int32_t lino = 0;
  // Pessimistic default; cleared only once every field has been read.
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  SSdbRow *pRow = NULL;
  SVgObj  *pVgroup = NULL;

  int8_t sver = 0;
  if (sdbGetRawSoftVer(pRaw, &sver) != 0) goto _OVER;

  if (sver < 1 || sver > VGROUP_VER_NUMBER) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
    goto _OVER;
  }

  pRow = sdbAllocRow(sizeof(SVgObj));
  if (pRow == NULL) goto _OVER;

  pVgroup = sdbGetRowObj(pRow);
  if (pVgroup == NULL) goto _OVER;

  int32_t dataPos = 0;
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->vgId, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->createdTime, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->updateTime, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->version, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->hashBegin, _OVER)
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->hashEnd, _OVER)
  SDB_GET_BINARY(pRaw, dataPos, pVgroup->dbName, TSDB_DB_FNAME_LEN, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pVgroup->dbUid, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &pVgroup->isTsma, _OVER)
  SDB_GET_INT8(pRaw, dataPos, &pVgroup->replica, _OVER)

  // The replica count comes straight from the record and drives writes into
  // vnodeGid[]; reject a count that does not fit the array instead of
  // writing past its end.
  if (pVgroup->replica > (int32_t)(sizeof(pVgroup->vnodeGid) / sizeof(pVgroup->vnodeGid[0]))) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_LEN;
    goto _OVER;
  }

  for (int8_t i = 0; i < pVgroup->replica; ++i) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[i];
    SDB_GET_INT32(pRaw, dataPos, &pVgid->dnodeId, _OVER)
    // A single-replica vgroup has no peers: its only member is marked leader.
    if (pVgroup->replica == 1) {
      pVgid->syncState = TAOS_SYNC_STATE_LEADER;
    }
  }
  if (dataPos + 2 * sizeof(int32_t) + VGROUP_RESERVE_SIZE <= pRaw->dataLen) {
    SDB_GET_INT32(pRaw, dataPos, &pVgroup->syncConfChangeVer, _OVER)
  }
  SDB_GET_INT32(pRaw, dataPos, &pVgroup->mountVgId, _OVER)
  if (dataPos + sizeof(int64_t) + VGROUP_RESERVE_SIZE <= pRaw->dataLen) {
    SDB_GET_INT64(pRaw, dataPos, &pVgroup->keepVersion, _OVER)
  }
  if (dataPos + sizeof(int64_t) + VGROUP_RESERVE_SIZE <= pRaw->dataLen) {
    SDB_GET_INT64(pRaw, dataPos, &pVgroup->keepVersionTime, _OVER)
  }
  SDB_GET_RESERVE(pRaw, dataPos, VGROUP_RESERVE_SIZE, _OVER)

  terrno = 0;

_OVER:
  if (terrno != 0) {
    mError("vgId:%d, failed to decode from raw:%p since %s", pVgroup == NULL ? 0 : pVgroup->vgId, pRaw, terrstr());
    taosMemoryFreeClear(pRow);
    return NULL;
  }

  mTrace("vgId:%d, decode from raw:%p, row:%p", pVgroup->vgId, pRaw, pVgroup);
  return pRow;
}
203

204
// Validation hook for a new-vgroup transaction action.
//
// Decodes the raw record and rejects it (code -1) when the current maximum
// vgroup id in the SDB is already greater than the id carried by the record.
// A decode failure yields terrno if it is set, otherwise
// TSDB_CODE_MND_RETURN_VALUE_NULL. The temporary row is always released.
static int32_t mndNewVgActionValidate(SMnode *pMnode, STrans *pTrans, SSdbRaw *pRaw) {
  int      code = -1;
  SSdb    *pSdb = pMnode->pSdb;
  SVgObj  *pDecoded = NULL;
  SSdbRow *pDecodedRow = mndVgroupActionDecode(pRaw);

  if (pDecodedRow != NULL) {
    pDecoded = sdbGetRowObj(pDecodedRow);
  }
  if (pDecodedRow == NULL || pDecoded == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto _OVER;
  }

  int32_t maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  if (maxVgId <= pDecoded->vgId) {
    code = 0;
  } else {
    mError("trans:%d, vgroup id %d already in use. maxVgId:%d", pTrans->id, pDecoded->vgId, maxVgId);
  }

_OVER:
  if (pDecoded != NULL) mndVgroupActionDelete(pSdb, pDecoded);
  taosMemoryFreeClear(pDecodedRow);
  TAOS_RETURN(code);
}
235

236
// SDB insert hook for vgroup rows: emits a trace line and always returns 0.
static int32_t mndVgroupActionInsert(SSdb *pSdb, SVgObj *pVgroup) {
  const int32_t result = 0;
  mTrace("vgId:%d, perform insert action, row:%p", pVgroup->vgId, pVgroup);
  return result;
}
240

241
// SDB delete hook for vgroup rows: emits a trace line and always returns 0.
static int32_t mndVgroupActionDelete(SSdb *pSdb, SVgObj *pVgroup) {
  const int32_t result = 0;
  mTrace("vgId:%d, perform delete action, row:%p", pVgroup->vgId, pVgroup);
  return result;
}
245

246
// SDB update hook: merges a freshly decoded vgroup row (pNew) into the
// in-memory row (pOld).
//
// Persisted fields are taken from pNew. Runtime-only state is carried the
// other way first: for every member of pNew that was already a member of
// pOld (same dnodeId) the sync/buffer state is copied from the old gid into
// the new gid, and the vgroup statistics are copied from pOld into pNew.
// The whole gid array of pNew is then copied over pOld's.
//
// Always returns 0.
static int32_t mndVgroupActionUpdate(SSdb *pSdb, SVgObj *pOld, SVgObj *pNew) {
  mTrace("vgId:%d, perform update action, old row:%p new row:%p", pOld->vgId, pOld, pNew);

  // Capture the member count of the OLD row before it is overwritten below.
  // The matching loop must walk the old member list with the old count;
  // using the new count dropped the runtime state of retained members
  // whenever the replica count shrank.
  const int32_t oldReplica = pOld->replica;

  pOld->updateTime = pNew->updateTime;
  pOld->version = pNew->version;
  pOld->hashBegin = pNew->hashBegin;
  pOld->hashEnd = pNew->hashEnd;
  pOld->replica = pNew->replica;
  pOld->isTsma = pNew->isTsma;
  pOld->keepVersion = pNew->keepVersion;
  pOld->keepVersionTime = pNew->keepVersionTime;

  for (int32_t i = 0; i < pNew->replica; ++i) {
    SVnodeGid *pNewGid = &pNew->vnodeGid[i];
    for (int32_t j = 0; j < oldReplica; ++j) {
      SVnodeGid *pOldGid = &pOld->vnodeGid[j];
      if (pNewGid->dnodeId == pOldGid->dnodeId) {
        pNewGid->syncState = pOldGid->syncState;
        pNewGid->syncRestore = pOldGid->syncRestore;
        pNewGid->syncCanRead = pOldGid->syncCanRead;
        pNewGid->syncAppliedIndex = pOldGid->syncAppliedIndex;
        pNewGid->syncCommitIndex = pOldGid->syncCommitIndex;
        pNewGid->bufferSegmentUsed = pOldGid->bufferSegmentUsed;
        pNewGid->bufferSegmentSize = pOldGid->bufferSegmentSize;
      }
    }
  }

  // Statistics flow from the old row into the new one.
  pNew->numOfTables = pOld->numOfTables;
  pNew->numOfTimeSeries = pOld->numOfTimeSeries;
  pNew->totalStorage = pOld->totalStorage;
  pNew->compStorage = pOld->compStorage;
  pNew->pointsWritten = pOld->pointsWritten;
  pNew->compact = pOld->compact;

  // Replace the old member list wholesale (all slots, not just `replica`).
  memcpy(pOld->vnodeGid, pNew->vnodeGid, (TSDB_MAX_REPLICA + TSDB_MAX_LEARNER_REPLICA) * sizeof(SVnodeGid));
  pOld->syncConfChangeVer = pNew->syncConfChangeVer;
  tstrncpy(pOld->dbName, pNew->dbName, TSDB_DB_FNAME_LEN);
  return 0;
}
282

283
// Looks up a vgroup by id via sdbAcquire(). When the lookup fails with
// TSDB_CODE_SDB_OBJ_NOT_THERE, terrno is rewritten to
// TSDB_CODE_MND_VGROUP_NOT_EXIST. Returns the object or NULL.
SVgObj *mndAcquireVgroup(SMnode *pMnode, int32_t vgId) {
  SVgObj *pFound = sdbAcquire(pMnode->pSdb, SDB_VGROUP, &vgId);
  if (pFound != NULL) {
    return pFound;
  }

  if (terrno == TSDB_CODE_SDB_OBJ_NOT_THERE) {
    terrno = TSDB_CODE_MND_VGROUP_NOT_EXIST;
  }
  return NULL;
}
291

292
// Hands a vgroup object back to the SDB through sdbRelease().
void mndReleaseVgroup(SMnode *pMnode, SVgObj *pVgroup) {
  sdbRelease(pMnode->pSdb, pVgroup);
}
113,285,246✔
296

297
// Builds the serialized create-vnode request sent to `pDnode` for `pVgroup`.
//
// Database-level settings come from pDb->cfg, vgroup-level settings from
// pVgroup. Each vgroup member is placed into either replicas[] (voters) or
// learnerReplicas[]; selfIndex / learnerSelfIndex record the position of
// `pDnode` inside its own array. pVgroup->syncConfChangeVer is incremented
// as a side effect and sent as changeVersion.
//
// Returns a buffer allocated with taosMemoryMalloc() and stores its length in
// *pContLen. Returns NULL on failure: a member dnode that cannot be acquired,
// `pDnode` not being a member (TSDB_CODE_APP_ERROR), or a sizing, allocation
// or serialization failure.
void *mndBuildCreateVnodeReq(SMnode *pMnode, SDnodeObj *pDnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SCreateVnodeReq createReq = {
      .vgId = pVgroup->vgId,
      .dbUid = pDb->uid,
      .vgVersion = pVgroup->version,
      .numOfStables = pDb->cfg.numOfStables,
      .buffer = pDb->cfg.buffer,
      .pageSize = pDb->cfg.pageSize,
      .pages = pDb->cfg.pages,
      .cacheLastSize = pDb->cfg.cacheLastSize,
      .daysPerFile = pDb->cfg.daysPerFile,
      .daysToKeep0 = pDb->cfg.daysToKeep0,
      .daysToKeep1 = pDb->cfg.daysToKeep1,
      .daysToKeep2 = pDb->cfg.daysToKeep2,
      .keepTimeOffset = pDb->cfg.keepTimeOffset,
      .ssChunkSize = pDb->cfg.ssChunkSize,
      .ssKeepLocal = pDb->cfg.ssKeepLocal,
      .ssCompact = pDb->cfg.ssCompact,
      .minRows = pDb->cfg.minRows,
      .maxRows = pDb->cfg.maxRows,
      .walFsyncPeriod = pDb->cfg.walFsyncPeriod,
      .walLevel = pDb->cfg.walLevel,
      .precision = pDb->cfg.precision,
      .compression = pDb->cfg.compression,
      .strict = pDb->cfg.strict,
      .cacheLast = pDb->cfg.cacheLast,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,
      .learnerSelfIndex = -1,
      .hashBegin = pVgroup->hashBegin,
      .hashEnd = pVgroup->hashEnd,
      .hashMethod = pDb->cfg.hashMethod,
      .numOfRetensions = pDb->cfg.numOfRetensions,
      .pRetensions = pDb->cfg.pRetensions,
      .isTsma = pVgroup->isTsma,
      .pTsma = pVgroup->pTsma,
      .walRetentionPeriod = pDb->cfg.walRetentionPeriod,
      .walRetentionSize = pDb->cfg.walRetentionSize,
      .walRollPeriod = pDb->cfg.walRollPeriod,
      .walSegmentSize = pDb->cfg.walSegmentSize,
      .sstTrigger = pDb->cfg.sstTrigger,
      .hashPrefix = pDb->cfg.hashPrefix,
      .hashSuffix = pDb->cfg.hashSuffix,
      .tsdbPageSize = pDb->cfg.tsdbPageSize,
      .changeVersion = ++(pVgroup->syncConfChangeVer),
      .encryptAlgorithm = pDb->cfg.encryptAlgorithm,
  };
  memcpy(createReq.db, pDb->name, TSDB_DB_FNAME_LEN);

  for (int32_t m = 0; m < pVgroup->replica; ++m) {
    SVnodeGid *pMember = &pVgroup->vnodeGid[m];
    bool       isVoter = (pMember->nodeRole == TAOS_SYNC_ROLE_VOTER);

    // Next free slot in the array that matches the member's role.
    SReplica *pSlot = isVoter ? &createReq.replicas[createReq.replica]
                              : &createReq.learnerReplicas[createReq.learnerReplica];

    SDnodeObj *pMemberDnode = mndAcquireDnode(pMnode, pMember->dnodeId);
    if (pMemberDnode == NULL) {
      return NULL;
    }
    pSlot->id = pMemberDnode->id;
    pSlot->port = pMemberDnode->port;
    memcpy(pSlot->fqdn, pMemberDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pMemberDnode);

    // Record where the target dnode sits, then advance the matching counter.
    if (isVoter) {
      if (pDnode->id == pMember->dnodeId) {
        createReq.selfIndex = createReq.replica;
      }
      createReq.replica++;
    } else {
      if (pDnode->id == pMember->dnodeId) {
        createReq.learnerSelfIndex = createReq.learnerReplica;
      }
      createReq.learnerReplica++;
    }
  }

  // The target dnode must be one of the members.
  if (createReq.selfIndex == -1 && createReq.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  mInfo(
      "vgId:%d, build create vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d "
      "changeVersion:%d",
      createReq.vgId, createReq.replica, createReq.selfIndex, createReq.learnerReplica, createReq.learnerSelfIndex,
      createReq.strict, createReq.changeVersion);
  for (int32_t r = 0; r < createReq.replica; ++r) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", createReq.vgId, r, createReq.replicas[r].fqdn, createReq.replicas[r].port);
  }
  for (int32_t r = 0; r < createReq.learnerReplica; ++r) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", createReq.vgId, r, createReq.learnerReplicas[r].fqdn,
          createReq.learnerReplicas[r].port);
  }

  // First pass sizes the message, second pass fills the buffer.
  void   *pBuf = NULL;
  int32_t bufLen = tSerializeSCreateVnodeReq(NULL, 0, &createReq);
  if (bufLen >= 0) {
    pBuf = taosMemoryMalloc(bufLen);
  }
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  int32_t code = tSerializeSCreateVnodeReq(pBuf, bufLen, &createReq);
  if (code < 0) {
    terrno = TSDB_CODE_APP_ERROR;
    taosMemoryFree(pBuf);
    mError("vgId:%d, failed to serialize create vnode req,since %s", createReq.vgId, terrstr());
    return NULL;
  }

  *pContLen = bufLen;
  return pBuf;
}
426

427
// Builds the alter-vnode-config message for `pVgroup` from the settings in
// pDb->cfg.
//
// The message is an SMsgHead (contLen and vgId in network byte order)
// followed by the serialized SAlterVnodeConfigReq.
//
// Returns a buffer allocated with taosMemoryMalloc() and stores the total
// length (head + body) in *pContLen. Returns NULL with terrno set to
// TSDB_CODE_OUT_OF_MEMORY on any failure.
static void *mndBuildAlterVnodeConfigReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SAlterVnodeConfigReq alterReq = {0};
  alterReq.vgVersion = pVgroup->version;
  alterReq.buffer = pDb->cfg.buffer;
  alterReq.pageSize = pDb->cfg.pageSize;
  alterReq.pages = pDb->cfg.pages;
  alterReq.cacheLastSize = pDb->cfg.cacheLastSize;
  alterReq.daysPerFile = pDb->cfg.daysPerFile;
  alterReq.daysToKeep0 = pDb->cfg.daysToKeep0;
  alterReq.daysToKeep1 = pDb->cfg.daysToKeep1;
  alterReq.daysToKeep2 = pDb->cfg.daysToKeep2;
  alterReq.keepTimeOffset = pDb->cfg.keepTimeOffset;
  alterReq.walFsyncPeriod = pDb->cfg.walFsyncPeriod;
  alterReq.walLevel = pDb->cfg.walLevel;
  alterReq.strict = pDb->cfg.strict;
  alterReq.cacheLast = pDb->cfg.cacheLast;
  alterReq.sttTrigger = pDb->cfg.sstTrigger;
  alterReq.minRows = pDb->cfg.minRows;
  alterReq.walRetentionPeriod = pDb->cfg.walRetentionPeriod;
  alterReq.walRetentionSize = pDb->cfg.walRetentionSize;
  alterReq.ssKeepLocal = pDb->cfg.ssKeepLocal;
  alterReq.ssCompact = pDb->cfg.ssCompact;

  mInfo("vgId:%d, build alter vnode config req", pVgroup->vgId);

  // Size of the serialized body only; the head is accounted for separately.
  int32_t bodyLen = tSerializeSAlterVnodeConfigReq(NULL, 0, &alterReq);
  if (bodyLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  int32_t contLen = bodyLen + (int32_t)sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  // The body starts after the head, so only bodyLen bytes are available to
  // the serializer. Passing the full contLen overstated the writable space
  // by sizeof(SMsgHead).
  if (tSerializeSAlterVnodeConfigReq((char *)pReq + sizeof(SMsgHead), bodyLen, &alterReq) < 0) {
    taosMemoryFree(pReq);
    mError("vgId:%d, failed to serialize alter vnode config req,since %s", pVgroup->vgId, terrstr());
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
477

478
// Builds the serialized alter-vnode-replica request addressed to the member
// of `pVgroup` that lives on dnode `dnodeId`.
//
// Each vgroup member is placed into either replicas[] (voters) or
// learnerReplicas[]. selfIndex / learnerSelfIndex hold the position of the
// target dnode inside its own array, the same convention used by
// mndBuildCreateVnodeReq(). The original stored the loop index over the
// mixed vnodeGid[] list, which is a different number as soon as voters and
// learners are both present.
// pVgroup->syncConfChangeVer is incremented as a side effect and sent as
// changeVersion.
//
// Returns a buffer allocated with taosMemoryMalloc() and stores its length in
// *pContLen. Returns NULL on failure: a member dnode that cannot be acquired,
// `dnodeId` not being a member (TSDB_CODE_APP_ERROR), or a sizing, allocation
// or serialization failure (TSDB_CODE_OUT_OF_MEMORY).
static void *mndBuildAlterVnodeReplicaReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen) {
  SAlterVnodeReplicaReq alterReq = {
      .vgId = pVgroup->vgId,
      .strict = pDb->cfg.strict,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,
      .learnerSelfIndex = -1,
      .changeVersion = ++(pVgroup->syncConfChangeVer),
  };

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    bool       isVoter = (pVgid->nodeRole == TAOS_SYNC_ROLE_VOTER);

    // Next free slot in the array that matches the member's role.
    SReplica *pReplica =
        isVoter ? &alterReq.replicas[alterReq.replica] : &alterReq.learnerReplicas[alterReq.learnerReplica];

    SDnodeObj *pVgidDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
    if (pVgidDnode == NULL) return NULL;

    pReplica->id = pVgidDnode->id;
    pReplica->port = pVgidDnode->port;
    memcpy(pReplica->fqdn, pVgidDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pVgidDnode);

    // Record the slot index (not the vnodeGid index), then advance the counter.
    if (isVoter) {
      if (dnodeId == pVgid->dnodeId) {
        alterReq.selfIndex = alterReq.replica;
      }
      alterReq.replica++;
    } else {
      if (dnodeId == pVgid->dnodeId) {
        alterReq.learnerSelfIndex = alterReq.learnerReplica;
      }
      alterReq.learnerReplica++;
    }
  }

  mInfo(
      "vgId:%d, build alter vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d "
      "changeVersion:%d",
      alterReq.vgId, alterReq.replica, alterReq.selfIndex, alterReq.learnerReplica, alterReq.learnerSelfIndex,
      alterReq.strict, alterReq.changeVersion);
  for (int32_t i = 0; i < alterReq.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", alterReq.vgId, i, alterReq.replicas[i].fqdn, alterReq.replicas[i].port);
  }
  for (int32_t i = 0; i < alterReq.learnerReplica; ++i) {
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", alterReq.vgId, i, alterReq.learnerReplicas[i].fqdn,
          alterReq.learnerReplicas[i].port);
  }

  // The target dnode must be one of the members.
  if (alterReq.selfIndex == -1 && alterReq.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  // First pass sizes the message, second pass fills the buffer.
  int32_t contLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &alterReq);
  if (contLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeReplicaReq(pReq, contLen, &alterReq) < 0) {
    mError("vgId:%d, failed to serialize alter vnode req,since %s", alterReq.vgId, terrstr());
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
560

561
// Builds the serialized check-learner-catchup request addressed to the member
// of `pVgroup` that lives on dnode `dnodeId`.
//
// Each vgroup member is placed into either replicas[] (voters) or
// learnerReplicas[]. selfIndex / learnerSelfIndex hold the position of the
// target dnode inside its own array, the same convention used by
// mndBuildCreateVnodeReq(). The original stored the loop index over the
// mixed vnodeGid[] list instead.
// The request is serialized with tSerializeSAlterVnodeReplicaReq().
// NOTE(review): the info log below still says "build alter vnode req"; the
// text is left untouched in case log consumers match on it.
//
// Returns a buffer allocated with taosMemoryMalloc() and stores its length in
// *pContLen. Returns NULL on failure: a member dnode that cannot be acquired,
// `dnodeId` not being a member (TSDB_CODE_APP_ERROR), or a sizing, allocation
// or serialization failure (TSDB_CODE_OUT_OF_MEMORY).
static void *mndBuildCheckLearnCatchupReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen) {
  SCheckLearnCatchupReq req = {
      .vgId = pVgroup->vgId,
      .strict = pDb->cfg.strict,
      .replica = 0,
      .learnerReplica = 0,
      .selfIndex = -1,
      .learnerSelfIndex = -1,
  };

  for (int32_t v = 0; v < pVgroup->replica; ++v) {
    SVnodeGid *pVgid = &pVgroup->vnodeGid[v];
    bool       isVoter = (pVgid->nodeRole == TAOS_SYNC_ROLE_VOTER);

    // Next free slot in the array that matches the member's role.
    SReplica *pReplica = isVoter ? &req.replicas[req.replica] : &req.learnerReplicas[req.learnerReplica];

    SDnodeObj *pVgidDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
    if (pVgidDnode == NULL) return NULL;

    pReplica->id = pVgidDnode->id;
    pReplica->port = pVgidDnode->port;
    memcpy(pReplica->fqdn, pVgidDnode->fqdn, TSDB_FQDN_LEN);
    mndReleaseDnode(pMnode, pVgidDnode);

    // Record the slot index (not the vnodeGid index), then advance the counter.
    if (isVoter) {
      if (dnodeId == pVgid->dnodeId) {
        req.selfIndex = req.replica;
      }
      req.replica++;
    } else {
      if (dnodeId == pVgid->dnodeId) {
        req.learnerSelfIndex = req.learnerReplica;
      }
      req.learnerReplica++;
    }
  }

  mInfo("vgId:%d, build alter vnode req, replica:%d selfIndex:%d learnerReplica:%d learnerSelfIndex:%d strict:%d",
        req.vgId, req.replica, req.selfIndex, req.learnerReplica, req.learnerSelfIndex, req.strict);
  for (int32_t i = 0; i < req.replica; ++i) {
    mInfo("vgId:%d, replica:%d ep:%s:%u", req.vgId, i, req.replicas[i].fqdn, req.replicas[i].port);
  }
  for (int32_t i = 0; i < req.learnerReplica; ++i) {
    mInfo("vgId:%d, learnerReplica:%d ep:%s:%u", req.vgId, i, req.learnerReplicas[i].fqdn, req.learnerReplicas[i].port);
  }

  // The target dnode must be one of the members.
  if (req.selfIndex == -1 && req.learnerSelfIndex == -1) {
    terrno = TSDB_CODE_APP_ERROR;
    return NULL;
  }

  // First pass sizes the message, second pass fills the buffer.
  int32_t contLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &req);
  if (contLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSAlterVnodeReplicaReq(pReq, contLen, &req) < 0) {
    mError("vgId:%d, failed to serialize alter vnode req,since %s", req.vgId, terrstr());
    taosMemoryFree(pReq);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
638

639
// Builds the serialized disable-write request (disable = 1) for vnode `vgId`.
//
// Returns a buffer allocated with taosMemoryMalloc() and stores its length in
// *pContLen. Returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY when
// sizing, allocation or serialization fails.
static void *mndBuildDisableVnodeWriteReq(SMnode *pMnode, SDbObj *pDb, int32_t vgId, int32_t *pContLen) {
  SDisableVnodeWriteReq disableReq = {0};
  disableReq.vgId = vgId;
  disableReq.disable = 1;

  mInfo("vgId:%d, build disable vnode write req", vgId);

  // First pass sizes the message; allocate only when sizing succeeded.
  void   *pBuf = NULL;
  int32_t bufLen = tSerializeSDisableVnodeWriteReq(NULL, 0, &disableReq);
  if (bufLen >= 0) {
    pBuf = taosMemoryMalloc(bufLen);
  }
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // Second pass fills the buffer.
  if (tSerializeSDisableVnodeWriteReq(pBuf, bufLen, &disableReq) >= 0) {
    *pContLen = bufLen;
    return pBuf;
  }

  mError("vgId:%d, failed to serialize disable vnode write req,since %s", vgId, terrstr());
  taosMemoryFree(pBuf);
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}
667

668
// Builds the serialized alter-hash-range request: source vnode `srcVgId`,
// destination id and hash range taken from `pVgroup`.
// pVgroup->syncConfChangeVer is incremented as a side effect and sent as
// changeVersion.
//
// Returns a buffer allocated with taosMemoryMalloc() and stores its length in
// *pContLen. Returns NULL with terrno set to TSDB_CODE_OUT_OF_MEMORY when
// sizing, allocation or serialization fails.
static void *mndBuildAlterVnodeHashRangeReq(SMnode *pMnode, int32_t srcVgId, SVgObj *pVgroup, int32_t *pContLen) {
  SAlterVnodeHashRangeReq alterReq = {0};
  alterReq.srcVgId = srcVgId;
  alterReq.dstVgId = pVgroup->vgId;
  alterReq.hashBegin = pVgroup->hashBegin;
  alterReq.hashEnd = pVgroup->hashEnd;
  alterReq.changeVersion = ++(pVgroup->syncConfChangeVer);

  mInfo("vgId:%d, build alter vnode hashrange req, dstVgId:%d, hashrange:[%u, %u]", srcVgId, pVgroup->vgId,
        pVgroup->hashBegin, pVgroup->hashEnd);

  // First pass sizes the message; allocate only when sizing succeeded.
  void   *pBuf = NULL;
  int32_t bufLen = tSerializeSAlterVnodeHashRangeReq(NULL, 0, &alterReq);
  if (bufLen >= 0) {
    pBuf = taosMemoryMalloc(bufLen);
  }
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // Second pass fills the buffer.
  if (tSerializeSAlterVnodeHashRangeReq(pBuf, bufLen, &alterReq) >= 0) {
    *pContLen = bufLen;
    return pBuf;
  }

  mError("vgId:%d, failed to serialize alter vnode hashrange req,since %s", srcVgId, terrstr());
  taosMemoryFree(pBuf);
  terrno = TSDB_CODE_OUT_OF_MEMORY;
  return NULL;
}
700

701
// Build the serialized payload of a "drop vnode" request for the replica of
// pVgroup located on pDnode.
//
// The request carries the dnode id, the vgroup id, the database full name
// (TSDB_DB_FNAME_LEN bytes copied from pDb->name) and the database uid.
// pContLen receives the payload length on success.
//
// Returns a buffer obtained from taosMemoryMalloc (not freed here), or NULL
// with terrno set to TSDB_CODE_OUT_OF_MEMORY on any failure.
void *mndBuildDropVnodeReq(SMnode *pMnode, SDnodeObj *pDnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen) {
  SDropVnodeReq req = {.dnodeId = pDnode->id, .vgId = pVgroup->vgId, .dbUid = pDb->uid};
  memcpy(req.db, pDb->name, TSDB_DB_FNAME_LEN);

  mInfo("vgId:%d, build drop vnode req", req.vgId);

  // First pass with a NULL buffer only measures the encoded size.
  int32_t len = tSerializeSDropVnodeReq(NULL, 0, &req);
  void   *pBuf = NULL;
  if (len >= 0) {
    pBuf = taosMemoryMalloc(len);
  }
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  if (tSerializeSDropVnodeReq(pBuf, len, &req) < 0) {
    mError("vgId:%d, failed to serialize drop vnode req,since %s", req.vgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = len;
  return pBuf;
}
730

731
// sdbTraverse callback: zero the per-dnode counters (numOfVnodes and
// numOfOtherNodes) of the visited dnode. p1..p3 are unused.
// Always returns true.
static bool mndResetDnodesArrayFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pNode = (SDnodeObj *)pObj;

  pNode->numOfOtherNodes = 0;
  pNode->numOfVnodes = 0;
  return true;
}
737

738
// sdbTraverse callback that collects candidate dnodes into an array.
//
// pObj : the visited SDnodeObj
// p1   : SArray receiving a copy of every accepted dnode
// p2   : pointer to an int32_t dnode id that must be skipped
// p3   : optional SArray whose elements are read as int32_t dnode ids; when it
//        is non-NULL only dnodes whose id appears in it are considered, and an
//        empty list rejects every dnode (TS-6191)
//
// For every dnode that passes the filters the vnode count and used memory are
// refreshed, numOfOtherNodes is bumped when the dnode also hosts an mnode, and
// the dnode is appended to p1 if it is online and supports at least one vnode.
// Returns false only when appending to p1 fails, true otherwise.
static bool mndBuildDnodesArrayFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pNode = pObj;
  SArray    *pOut = p1;
  int32_t    skipId = *(int32_t *)p2;
  SArray    *pAllowed = p3;

  if (pNode->id == skipId) {
    return true;
  }

  if (pAllowed != NULL) {
    int32_t allowedCnt = taosArrayGetSize(pAllowed);
    if (allowedCnt <= 0) {
      return true;  // TS-6191
    }

    bool    found = false;
    int32_t k = 0;
    while (k < allowedCnt && !found) {
      int32_t allowedId = *(int32_t *)taosArrayGet(pAllowed, k);
      found = (allowedId == pNode->id);
      ++k;
    }
    if (!found) {
      return true;
    }
  }

  int64_t nowMs = taosGetTimestampMs();
  bool    isOnline = mndIsDnodeOnline(pNode, nowMs);
  bool    hostsMnode = mndIsMnode(pMnode, pNode->id);
  pNode->numOfVnodes = mndGetVnodesNum(pMnode, pNode->id);
  pNode->memUsed = mndGetVnodesMemory(pMnode, pNode->id);

  mInfo("dnode:%d, vnodes:%d supportVnodes:%d isMnode:%d online:%d memory avail:%" PRId64 " used:%" PRId64, pNode->id,
        pNode->numOfVnodes, pNode->numOfSupportVnodes, hostsMnode, isOnline, pNode->memAvail, pNode->memUsed);

  if (hostsMnode) {
    pNode->numOfOtherNodes++;
  }

  // Offline dnodes and dnodes that cannot host vnodes are visited but not collected.
  if (!isOnline || pNode->numOfSupportVnodes <= 0) {
    return true;
  }
  return taosArrayPush(pOut, pNode) != NULL;
}
784

785
// Return true when dnodeId equals the int32_t read from the start of any
// element of dnodeList, false otherwise (including for an empty list).
static bool isDnodeInList(SArray *dnodeList, int32_t dnodeId) {
  int32_t remaining = taosArrayGetSize(dnodeList);
  int32_t pos = 0;

  while (pos < remaining) {
    int32_t candidate = *(int32_t *)TARRAY_GET_ELEM(dnodeList, pos);
    if (candidate == dnodeId) {
      return true;
    }
    ++pos;
  }
  return false;
}
795

796
#ifdef TD_ENTERPRISE
797
// Load score used by the dual-replica dnode ordering.
//
// The magnitude is (numOfVnodes + numOfOtherNodes * ratio + additionDnodes)
// divided by numOfSupportVnodes. Dnodes that already host at least one vnode
// get the negated value, so they compare lower than dnodes without vnodes.
static float mndGetDnodeScore1(SDnodeObj *pDnode, int32_t additionDnodes, float ratio) {
  float load = pDnode->numOfVnodes + (float)pDnode->numOfOtherNodes * ratio + additionDnodes;
  float score = load / pDnode->numOfSupportVnodes;

  if (pDnode->numOfVnodes > 0) {
    return -score;
  }
  return score;
}
802

803
// Comparator for SDnodeObj elements: orders by mndGetDnodeScore1 (ratio 0.9)
// ascending and breaks ties by dnode id ascending. Returns -1, 0 or 1.
static int32_t mndCompareDnodeVnodes1(SDnodeObj *pDnode1, SDnodeObj *pDnode2) {
  float lhs = mndGetDnodeScore1(pDnode1, 0, 0.9);
  float rhs = mndGetDnodeScore1(pDnode2, 0, 0.9);

  if (lhs != rhs) {
    return lhs > rhs ? 1 : -1;
  }

  // Equal scores: fall back to the dnode id so the order is deterministic.
  if (pDnode1->id > pDnode2->id) {
    return 1;
  }
  return pDnode1->id == pDnode2->id ? 0 : -1;
}
814

815
// sdbTraverse callback used by the dual-replica check.
//
// Refreshes the visited dnode's vnode count, bumps numOfOtherNodes when the
// dnode also hosts an mnode, and appends a copy of the dnode to the SArray in
// p1 when it supports at least one vnode. Unlike mndBuildDnodesArrayFp no
// online check is made. p2 and p3 are unused.
// Returns false only when the append fails.
static bool mndBuildDnodesListFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SDnodeObj *pNode = pObj;
  SArray    *pOut = p1;

  bool hostsMnode = mndIsMnode(pMnode, pNode->id);
  pNode->numOfVnodes = mndGetVnodesNum(pMnode, pNode->id);
  if (hostsMnode) {
    pNode->numOfOtherNodes++;
  }

  if (pNode->numOfSupportVnodes <= 0) {
    return true;
  }
  return taosArrayPush(pOut, pNode) != NULL;
}
831

832
// TS-6191
833
// Build the restricted dnode list used when the dual-replica grant check
// (grantCheckDualReplicaDnodes) applies.
//
// nDnodes     : initial capacity of the new list
// dnodeList   : optional user supplied dnode id list (may be NULL or empty)
// ppDnodeList : receives the newly created list of SDnodeObj; left untouched
//               when the grant check does not apply or the allocation fails
//
// Steps once the check applies:
//   1. collect every dnode that supports vnodes and sort it with
//      mndCompareDnodeVnodes1;
//   2. without a user list, keep at most the first two dnodes;
//   3. with a user list, count the leading dnodes that already host vnodes;
//      when there are two or more, trim the list to the first two; then drop
//      every dnode that is not in the user list; when exactly one dnode hosted
//      vnodes and it is no longer first, drop the last remaining element.
//
// Returns 0, or terrno when the list cannot be allocated.
static int32_t mndBuildNodesCheckDualReplica(SMnode *pMnode, int32_t nDnodes, SArray *dnodeList, SArray **ppDnodeList) {
  int32_t code = 0;
  if (!grantCheckDualReplicaDnodes(pMnode)) {
    TAOS_RETURN(code);
  }

  SSdb   *pSdb = pMnode->pSdb;
  SArray *pList = taosArrayInit(nDnodes, sizeof(SDnodeObj));
  if (pList == NULL) {
    TAOS_RETURN(code = terrno);
  }
  *ppDnodeList = pList;

  sdbTraverse(pSdb, SDB_DNODE, mndResetDnodesArrayFp, NULL, NULL, NULL);
  sdbTraverse(pSdb, SDB_DNODE, mndBuildDnodesListFp, pList, NULL, NULL);

  int32_t total = taosArrayGetSize(pList);
  if (total <= 0) {
    TAOS_RETURN(code);
  }
  if (total > 1) {
    taosArraySort(pList, (__compar_fn_t)mndCompareDnodeVnodes1);
  }

  int32_t userCnt = taosArrayGetSize(dnodeList);
  if (userCnt <= 0) {
    // No user list: the first two dnodes of the sorted list are the only candidates.
    if (total > 2) {
      taosArrayRemoveBatch(pList, 2, total - 2, NULL);
    }
    TAOS_RETURN(code);
  }

  // Dnodes with vnodes sort first (negative score), so count the leading run.
  int32_t occupied = 0;
  while (occupied < total) {
    SDnodeObj *pNode = TARRAY_GET_ELEM(pList, occupied);
    if (pNode->numOfVnodes <= 0) {
      break;
    }
    ++occupied;
  }

  int32_t soleDnodeId = -1;
  if (occupied == 1) {
    soleDnodeId = ((SDnodeObj *)TARRAY_GET_ELEM(pList, 0))->id;
  } else if (occupied >= 2) {
    // must select the dnodes from the 1st 2 dnodes
    taosArrayRemoveBatch(pList, 2, total - 2, NULL);
  }

  // Drop every dnode the user did not list; the index only advances when the
  // current element is kept.
  int32_t idx = 0;
  while (idx < TARRAY_SIZE(pList)) {
    SDnodeObj *pNode = taosArrayGet(pList, idx);
    if (isDnodeInList(dnodeList, pNode->id)) {
      ++idx;
    } else {
      taosArrayRemove(pList, idx);
    }
  }

  if (occupied == 1) {
    SDnodeObj *pFirst = taosArrayGet(pList, 0);
    if (pFirst && (pFirst->id != soleDnodeId)) {  // the first dnode is not in dnodeList, remove the last element
      taosArrayRemove(pList, taosArrayGetSize(pList) - 1);
    }
  }

  TAOS_RETURN(code);
}
891
#endif
892

893
// Build the array of dnodes (copies of SDnodeObj) that may receive new vnodes.
//
// exceptDnodeId : id of a dnode that must never be included
// dnodeList     : optional list of allowed dnode ids; ignored when NULL/empty
//
// With TD_ENTERPRISE, mndBuildNodesCheckDualReplica may produce a replacement
// filter list, which then takes precedence over dnodeList and is destroyed
// before returning.
//
// Returns the new array (not destroyed here), or NULL on failure. terrno is set
// to TSDB_CODE_OUT_OF_MEMORY when the array itself cannot be allocated.
SArray *mndBuildDnodesArray(SMnode *pMnode, int32_t exceptDnodeId, SArray *dnodeList) {
  int32_t dnodeCnt = mndGetDnodeSize(pMnode);
  SArray *pCandidates = taosArrayInit(dnodeCnt, sizeof(SDnodeObj));
  if (pCandidates == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  // An empty user list is treated exactly like no list at all.
  SArray *pUserList = (taosArrayGetSize(dnodeList) > 0) ? dnodeList : NULL;
  SArray *pDualList = NULL;
#ifdef TD_ENTERPRISE
  if (mndBuildNodesCheckDualReplica(pMnode, dnodeCnt, pUserList, &pDualList) != 0) {
    taosArrayDestroy(pCandidates);
    return NULL;
  }
#endif

  SSdb   *pSdb = pMnode->pSdb;
  SArray *pFilter = (pDualList != NULL) ? pDualList : pUserList;
  sdbTraverse(pSdb, SDB_DNODE, mndResetDnodesArrayFp, NULL, NULL, NULL);
  sdbTraverse(pSdb, SDB_DNODE, mndBuildDnodesArrayFp, pCandidates, &exceptDnodeId, pFilter);

  int32_t built = (int32_t)taosArrayGetSize(pCandidates);
  mDebug("build %d dnodes array", built);
  for (int32_t n = 0; n < built; ++n) {
    SDnodeObj *pNode = taosArrayGet(pCandidates, n);
    mDebug("dnode:%d, vnodes:%d others:%d", pNode->id, pNode->numOfVnodes, pNode->numOfOtherNodes);
  }

  taosArrayDestroy(pDualList);
  return pCandidates;
}
924

925
// Three-way comparison of two dnode ids passed by pointer.
// Returns -1, 0 or 1 when *dnode1Id is less than, equal to or greater than
// *dnode2Id.
static int32_t mndCompareDnodeId(int32_t *dnode1Id, int32_t *dnode2Id) {
  int32_t lhs = *dnode1Id;
  int32_t rhs = *dnode2Id;

  if (lhs > rhs) {
    return 1;
  }
  return lhs < rhs ? -1 : 0;
}
931

932
// Load score of a dnode: (numOfVnodes + numOfOtherNodes * ratio +
// additionDnodes) divided by numOfSupportVnodes. A lower score means the dnode
// sorts earlier in mndCompareDnodeVnodes.
static float mndGetDnodeScore(SDnodeObj *pDnode, int32_t additionDnodes, float ratio) {
  float load = pDnode->numOfVnodes + (float)pDnode->numOfOtherNodes * ratio + additionDnodes;
  float score = load / pDnode->numOfSupportVnodes;
  return score;
}
936

937
// Comparator for SDnodeObj elements: orders by mndGetDnodeScore (ratio 0.9)
// ascending. Returns 1, 0 or -1; equal scores compare as equal.
static int32_t mndCompareDnodeVnodes(SDnodeObj *pDnode1, SDnodeObj *pDnode2) {
  float lhs = mndGetDnodeScore(pDnode1, 0, 0.9);
  float rhs = mndGetDnodeScore(pDnode2, 0, 0.9);

  if (lhs > rhs) {
    return 1;
  }
  if (lhs == rhs) {
    return 0;
  }
  return -1;
}
945

946
// Sort the first `replica` entries of pVgroup->vnodeGid in place by ascending
// dnodeId using a bubble sort; entries with equal dnodeId keep their relative
// order because only strictly greater neighbours are swapped.
void mndSortVnodeGid(SVgObj *pVgroup) {
  // After each pass the largest remaining dnodeId has settled at index `last`.
  for (int32_t last = pVgroup->replica - 1; last > 0; --last) {
    for (int32_t k = 0; k < last; ++k) {
      if (pVgroup->vnodeGid[k].dnodeId > pVgroup->vnodeGid[k + 1].dnodeId) {
        TSWAP(pVgroup->vnodeGid[k], pVgroup->vnodeGid[k + 1]);
      }
    }
  }
}
2,559,953✔
955

956
// Pick dnodes for every replica of pVgroup.
//
// pArray is sorted in place by load score (mndCompareDnodeVnodes) and the
// first `replica` dnodes are assigned to pVgroup->vnodeGid, which is finally
// sorted by dnode id. For each chosen dnode the copy held in pArray gets its
// memUsed and numOfVnodes increased, so later calls with the same array see
// the updated load.
//
// Returns 0 on success, or (also stored in terrno via TAOS_RETURN):
//   TSDB_CODE_MND_NO_ENOUGH_DNODES        fewer dnodes than replicas
//   TSDB_CODE_MND_NO_ENOUGH_VNODES        a chosen dnode is already full
//   TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE  a chosen dnode lacks memory
// Counters changed for earlier replicas are not rolled back on failure.
static int32_t mndGetAvailableDnode(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, SArray *pArray) {
  int32_t numOfDnodes = taosArrayGetSize(pArray);

  mDebug("start to sort %d dnodes", numOfDnodes);
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
  for (int32_t n = 0; n < numOfDnodes; ++n) {
    SDnodeObj *pNode = taosArrayGet(pArray, n);
    mDebug("dnode:%d, score:%f", pNode->id, mndGetDnodeScore(pNode, 0, 0.9));
  }

  if (numOfDnodes < pVgroup->replica) {
    mError("db:%s, vgId:%d, no enough online dnodes:%d to alloc %d replica", pVgroup->dbName, pVgroup->vgId,
           numOfDnodes, pVgroup->replica);
    TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
  }

  for (int32_t r = 0; r < pVgroup->replica; ++r) {
    SVnodeGid *pGid = &pVgroup->vnodeGid[r];
    SDnodeObj *pNode = taosArrayGet(pArray, r);
    if (pNode == NULL) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
    }
    if (pNode->numOfVnodes >= pNode->numOfSupportVnodes) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_VNODES);
    }

    // The dnode must still have memory left after hosting this vgroup.
    int64_t needMem = mndGetVgroupMemory(pMnode, pDb, pVgroup);
    if (pNode->memAvail - needMem - pNode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d, avail:%" PRId64 " used:%" PRId64,
             pVgroup->dbName, pVgroup->vgId, needMem, pNode->id, pNode->memAvail, pNode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    }
    pNode->memUsed += needMem;

    pGid->dnodeId = pNode->id;
    // A single-replica vgroup starts as leader; otherwise every replica starts as follower.
    pGid->syncState = (pVgroup->replica == 1) ? TAOS_SYNC_STATE_LEADER : TAOS_SYNC_STATE_FOLLOWER;

    mInfo("db:%s, vgId:%d, vn:%d is alloced, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
          pVgroup->dbName, pVgroup->vgId, r, needMem, pGid->dnodeId, pNode->memAvail, pNode->memUsed);
    pNode->numOfVnodes++;
  }

  mndSortVnodeGid(pVgroup);
  return 0;
}
1005

1006
// Initialise pVgroup as a single-replica TSMA vgroup of pDb and place it on
// the least loaded available dnode.
//
// The vgroup id is taken from sdbGetMaxId(SDB_VGROUP); created/update time are
// set to the current time, version to 1, and WAL keep-version is disabled
// (keepVersion = -1).
//
// Returns 0 on success. On failure returns the error code (also stored in
// terrno): the code from building the dnode array, or the code reported by
// mndGetAvailableDnode. The temporary dnode array is destroyed on every path.
int32_t mndAllocSmaVgroup(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = 0;
  SArray *pArray = mndBuildDnodesArray(pMnode, 0, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  pVgroup->vgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  pVgroup->isTsma = 1;
  pVgroup->createdTime = taosGetTimestampMs();
  pVgroup->updateTime = pVgroup->createdTime;
  pVgroup->version = 1;
  memcpy(pVgroup->dbName, pDb->name, TSDB_DB_FNAME_LEN);
  pVgroup->dbUid = pDb->uid;
  pVgroup->replica = 1;
  pVgroup->keepVersion = -1;  // default: WAL keep version disabled
  pVgroup->keepVersionTime = 0;

  code = mndGetAvailableDnode(pMnode, pDb, pVgroup, pArray);
  // The array is only needed for placement; release it before reporting the
  // result so the failure path no longer leaks it.
  taosArrayDestroy(pArray);
  if (code != 0) {
    TAOS_RETURN(code);
  }

  mInfo("db:%s, sma vgId:%d is alloced", pDb->name, pVgroup->vgId);
  return 0;
}
1032

1033
// Allocate and place all vgroups of a new database.
//
// pDb        : database whose cfg.numOfVgroups / cfg.replications drive the layout
// ppVgroups  : on success receives a taosMemoryCalloc'ed array of
//              cfg.numOfVgroups SVgObj (not freed here); untouched on failure
// dnodeList  : optional list of dnode ids the vnodes are restricted to
//
// The uint32 hash space [0, UINT32_MAX] is split into numOfVgroups equal
// intervals; the last vgroup absorbs the remainder so the ranges cover the
// whole space. Vgroup ids start at max(sdbGetMaxId(SDB_VGROUP), 2).
//
// Returns 0 on success, otherwise the error code (also stored in terrno).
// NOTE(review): cfg.numOfVgroups is used as a divisor and is assumed to be
// positive here - confirm it is validated by the caller.
int32_t mndAllocVgroup(SMnode *pMnode, SDbObj *pDb, SVgObj **ppVgroups, SArray *dnodeList) {
  int32_t code = -1;
  SArray *pArray = NULL;
  SVgObj *pVgroups = NULL;

  pVgroups = taosMemoryCalloc(pDb->cfg.numOfVgroups, sizeof(SVgObj));
  if (pVgroups == NULL) {
    code = terrno;
    goto _OVER;
  }

  pArray = mndBuildDnodesArray(pMnode, 0, dnodeList);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  mInfo("db:%s, total %d dnodes used to create %d vgroups (%d vnodes)", pDb->name, (int32_t)taosArrayGetSize(pArray),
        pDb->cfg.numOfVgroups, pDb->cfg.numOfVgroups * pDb->cfg.replications);

  int32_t  maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  uint32_t hashMin = 0;
  uint32_t hashMax = UINT32_MAX;
  uint32_t hashInterval = (hashMax - hashMin) / pDb->cfg.numOfVgroups;

  if (maxVgId < 2) maxVgId = 2;

  for (uint32_t v = 0; v < pDb->cfg.numOfVgroups; v++) {
    SVgObj *pVgroup = &pVgroups[v];
    pVgroup->vgId = maxVgId++;
    pVgroup->createdTime = taosGetTimestampMs();
    // Use this vgroup's own creation time; the array base (pVgroups) would
    // always yield the first vgroup's timestamp.
    pVgroup->updateTime = pVgroup->createdTime;
    pVgroup->version = 1;
    pVgroup->hashBegin = hashMin + hashInterval * v;
    if (v == pDb->cfg.numOfVgroups - 1) {
      // The last vgroup takes whatever the integer division left over.
      pVgroup->hashEnd = hashMax;
    } else {
      pVgroup->hashEnd = hashMin + hashInterval * (v + 1) - 1;
    }

    memcpy(pVgroup->dbName, pDb->name, TSDB_DB_FNAME_LEN);
    pVgroup->dbUid = pDb->uid;
    pVgroup->replica = pDb->cfg.replications;
    pVgroup->keepVersion = -1;  // default: WAL keep version disabled
    pVgroup->keepVersionTime = 0;

    if ((code = mndGetAvailableDnode(pMnode, pDb, pVgroup, pArray)) != 0) {
      goto _OVER;
    }
  }

  *ppVgroups = pVgroups;
  code = 0;

  mInfo("db:%s, total %d vgroups is alloced, replica:%d", pDb->name, pDb->cfg.numOfVgroups, pDb->cfg.replications);

_OVER:
  if (code != 0) taosMemoryFree(pVgroups);
  taosArrayDestroy(pArray);
  TAOS_RETURN(code);
}
1098

1099
// Build the endpoint set of a vgroup from the fqdn/port of each replica's
// dnode.
//
// Replicas whose dnode cannot be acquired are skipped. inUse is set to the
// index (at the time of insertion) of a replica whose sync state is LEADER or
// ASSIGNED_LEADER. A failed insertion is only logged. The set is passed to
// epsetSort before being returned by value.
SEpSet mndGetVgroupEpset(SMnode *pMnode, const SVgObj *pVgroup) {
  SEpSet result = {0};

  for (int32_t r = 0; r < pVgroup->replica; ++r) {
    const SVnodeGid *pGid = &pVgroup->vnodeGid[r];
    SDnodeObj       *pNode = mndAcquireDnode(pMnode, pGid->dnodeId);
    if (pNode != NULL) {
      bool leads = (pGid->syncState == TAOS_SYNC_STATE_LEADER || pGid->syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER);
      if (leads) {
        // numOfEps is the slot the endpoint is about to occupy.
        result.inUse = result.numOfEps;
      }

      if (addEpIntoEpSet(&result, pNode->fqdn, pNode->port) != 0) {
        mWarn("vgId:%d, failed to add ep:%s:%d into epset", pVgroup->vgId, pNode->fqdn, pNode->port);
      }
      mndReleaseDnode(pMnode, pNode);
    }
  }

  epsetSort(&result);
  return result;
}
1120

1121
// Look up a vgroup by id and build its endpoint set from the fqdn/port of each
// replica's dnode.
//
// Returns an all-zero SEpSet when the vgroup cannot be acquired. Replicas whose
// dnode cannot be acquired are skipped. inUse is set to the index (at the time
// of insertion) of a replica whose sync state is LEADER or ASSIGNED_LEADER.
// The set is returned in replica order (no sorting is applied here).
SEpSet mndGetVgroupEpsetById(SMnode *pMnode, int32_t vgId) {
  SEpSet result = {0};

  SVgObj *pVg = mndAcquireVgroup(pMnode, vgId);
  if (pVg == NULL) {
    return result;
  }

  for (int32_t r = 0; r < pVg->replica; ++r) {
    const SVnodeGid *pGid = &pVg->vnodeGid[r];
    SDnodeObj       *pNode = mndAcquireDnode(pMnode, pGid->dnodeId);
    if (pNode != NULL) {
      bool leads = (pGid->syncState == TAOS_SYNC_STATE_LEADER || pGid->syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER);
      if (leads) {
        // numOfEps is the slot the endpoint is about to occupy.
        result.inUse = result.numOfEps;
      }

      if (addEpIntoEpSet(&result, pNode->fqdn, pNode->port) != 0) {
        mWarn("vgId:%d, failed to add ep:%s:%d into epset", pVg->vgId, pNode->fqdn, pNode->port);
      }
      mndReleaseDnode(pMnode, pNode);
    }
  }

  mndReleaseVgroup(pMnode, pVg);
  return result;
}
1145

1146
// Show-retrieve callback that fills pBlock with one row per vgroup.
//
// When pShow->db is non-empty only vgroups of that database are listed; if the
// database cannot be acquired the function returns 0 rows. Iteration state is
// kept in pShow->pIter so the listing can continue across calls.
//
// Columns written per row, in order: vgId, db name, numOfTables, then for each
// of 4 replica slots (3 replicas plus 1 used while a vnode is being moved)
// dnode id / role / "applied/committed" index (NULL for unused slots), then
// cacheUsage, numOfCachedTables, isTsma, mountVgId, keepVersion and
// keepVersionTime.
//
// Returns the number of rows written, or an error code on failure. Every
// failure path releases the current vgroup, cancels the fetch iterator and
// leaves through _OVER so the acquired database is always released.
static int32_t mndRetrieveVgroups(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode *pMnode = pReq->info.node;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t numOfRows = 0;
  SVgObj *pVgroup = NULL;
  int32_t cols = 0;
  int64_t curMs = taosGetTimestampMs();
  int32_t code = 0, lino = 0;

  SDbObj *pDb = NULL;
  if (strlen(pShow->db) > 0) {
    pDb = mndAcquireDb(pMnode, pShow->db);
    if (pDb == NULL) {
      return 0;
    }
  }

  while (numOfRows < rows) {
    pShow->pIter = sdbFetch(pSdb, SDB_VGROUP, pShow->pIter, (void **)&pVgroup);
    if (pShow->pIter == NULL) break;

    // Skip vgroups that belong to another database.
    if (pDb != NULL && pVgroup->dbUid != pDb->uid) {
      sdbRelease(pSdb, pVgroup);
      continue;
    }

    cols = 0;
    SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->vgId, false, pVgroup, pShow->pIter, _OVER);

    SName name = {0};
    char  db[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
    code = tNameFromString(&name, pVgroup->dbName, T_NAME_ACCT | T_NAME_DB);
    if (code != 0) {
      mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
      sdbRelease(pSdb, pVgroup);
      sdbCancelFetch(pSdb, pShow->pIter);
      lino = __LINE__;
      goto _OVER;  // releases pDb, which a direct return would leak
    }
    (void)tNameGetDbName(&name, varDataVal(db));
    varDataSetLen(db, strlen(varDataVal(db)));

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)db, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->numOfTables, false, pVgroup, pShow->pIter, _OVER);

    // default 3 replica, add 1 replica if move vnode
    for (int32_t i = 0; i < 4; ++i) {
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      if (i < pVgroup->replica) {
        int16_t dnodeId = (int16_t)pVgroup->vnodeGid[i].dnodeId;
        COL_DATA_SET_VAL_GOTO((const char *)&dnodeId, false, pVgroup, pShow->pIter, _OVER);

        bool       exist = false;
        bool       online = false;
        SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgroup->vnodeGid[i].dnodeId);
        if (pDnode != NULL) {
          exist = true;
          online = mndIsDnodeOnline(pDnode, curMs);
          mndReleaseDnode(pMnode, pDnode);
        }

        // Role text: "dropping" when the dnode no longer exists, "offline"
        // when it exists but is not online, otherwise the sync state name.
        char buf1[20] = {0};
        char role[20] = "offline";
        if (!exist) {
          tstrncpy(role, "dropping", sizeof(role));
        } else if (online) {
          // A leader that has not finished restoring is marked with "**" when
          // it cannot be read yet and with "*" when it already can.
          char *star = "";
          if (pVgroup->vnodeGid[i].syncState == TAOS_SYNC_STATE_LEADER ||
              pVgroup->vnodeGid[i].syncState == TAOS_SYNC_STATE_ASSIGNED_LEADER) {
            if (!pVgroup->vnodeGid[i].syncRestore && !pVgroup->vnodeGid[i].syncCanRead) {
              star = "**";
            } else if (!pVgroup->vnodeGid[i].syncRestore && pVgroup->vnodeGid[i].syncCanRead) {
              star = "*";
            }
          }
          snprintf(role, sizeof(role), "%s%s", syncStr(pVgroup->vnodeGid[i].syncState), star);
        }
        STR_WITH_MAXSIZE_TO_VARSTR(buf1, role, pShow->pMeta->pSchemas[cols].bytes);

        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        COL_DATA_SET_VAL_GOTO((const char *)buf1, false, pVgroup, pShow->pIter, _OVER);

        char applyStr[TSDB_SYNC_APPLY_COMMIT_LEN + 1] = {0};
        char buf[TSDB_SYNC_APPLY_COMMIT_LEN + VARSTR_HEADER_SIZE + 1] = {0};
        snprintf(applyStr, sizeof(applyStr), "%" PRId64 "/%" PRId64, pVgroup->vnodeGid[i].syncAppliedIndex,
                 pVgroup->vnodeGid[i].syncCommitIndex);
        STR_WITH_MAXSIZE_TO_VARSTR(buf, applyStr, pShow->pMeta->pSchemas[cols].bytes);

        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        COL_DATA_SET_VAL_GOTO((const char *)&buf, false, pVgroup, pShow->pIter, _OVER);
      } else {
        // Unused replica slot: all three of its columns are NULL.
        colDataSetNULL(pColInfo, numOfRows);
        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        colDataSetNULL(pColInfo, numOfRows);
        pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
        colDataSetNULL(pColInfo, numOfRows);
      }
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    int32_t cacheUsage = (int32_t)pVgroup->cacheUsage;
    COL_DATA_SET_VAL_GOTO((const char *)&cacheUsage, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->numOfCachedTables, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->isTsma, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    COL_DATA_SET_VAL_GOTO((const char *)&pVgroup->mountVgId, false, pVgroup, pShow->pIter, _OVER);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->keepVersion, false);
    if (code != 0) {
      mError("vgId:%d, failed to set keepVersion, since %s", pVgroup->vgId, tstrerror(code));
      sdbRelease(pSdb, pVgroup);
      sdbCancelFetch(pSdb, pShow->pIter);
      lino = __LINE__;
      goto _OVER;
    }

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->keepVersionTime, false);
    if (code != 0) {
      mError("vgId:%d, failed to set keepVersionTime, since %s", pVgroup->vgId, tstrerror(code));
      sdbRelease(pSdb, pVgroup);
      sdbCancelFetch(pSdb, pShow->pIter);
      lino = __LINE__;
      goto _OVER;
    }

    numOfRows++;
    sdbRelease(pSdb, pVgroup);
  }
_OVER:
  if (pDb != NULL) {
    mndReleaseDb(pMnode, pDb);
  }
  if (code != 0) {
    mError("failed to retrieve vgroup info at line %d since %s", lino, tstrerror(code));
    TAOS_RETURN(code);
  }

  pShow->numOfRows += numOfRows;
  return numOfRows;
}
1314

1315
// Cancel an in-progress SDB_VGROUP fetch identified by pIter.
static void mndCancelGetNextVgroup(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_VGROUP);
}
×
1319

1320
// sdbTraverse callback over vgroups: adds to the int32_t counter behind p2 the
// number of replicas of the visited vgroup that live on the dnode whose id is
// stored behind p1. p3 is unused. Always returns true.
static bool mndGetVnodesNumFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SVgObj  *pVg = pObj;
  int32_t  wantedDnode = *(int32_t *)p1;
  int32_t *pCounter = (int32_t *)p2;

  int32_t r = 0;
  while (r < pVg->replica) {
    if (pVg->vnodeGid[r].dnodeId == wantedDnode) {
      *pCounter += 1;
    }
    ++r;
  }

  return true;
}
1333

1334
// Count the vnodes (vgroup replicas) located on the given dnode by traversing
// every vgroup in the sdb.
int32_t mndGetVnodesNum(SMnode *pMnode, int32_t dnodeId) {
  int32_t total = 0;
  SSdb   *pSdb = pMnode->pSdb;

  sdbTraverse(pSdb, SDB_VGROUP, mndGetVnodesNumFp, &dnodeId, &total, NULL);
  return total;
}
1339

1340
// Memory, in bytes, attributed to one vnode of pVgroup according to its
// database configuration:
//   cfg.buffer * 1024 * 1024 + cfg.pages * cfg.pageSize * 1024,
//   plus cfg.cacheLastSize * 1024 * 1024 when cfg.cacheLast > 0.
//
// pDbInput may be NULL, in which case the database is acquired by
// pVgroup->dbName for the duration of the call and released afterwards.
// Returns 0 when no database is available.
int64_t mndGetVgroupMemory(SMnode *pMnode, SDbObj *pDbInput, SVgObj *pVgroup) {
  bool    acquiredHere = (pDbInput == NULL);
  SDbObj *pDb = acquiredHere ? mndAcquireDb(pMnode, pVgroup->dbName) : pDbInput;

  int64_t total = 0;
  if (pDb != NULL) {
    int64_t buffer = (int64_t)pDb->cfg.buffer * 1024 * 1024;
    int64_t cache = (int64_t)pDb->cfg.pages * pDb->cfg.pageSize * 1024;
    int64_t cacheLast = (int64_t)pDb->cfg.cacheLastSize * 1024 * 1024;

    total = buffer + cache;
    if (pDb->cfg.cacheLast > 0) {
      total += cacheLast;
    }
    mDebug("db:%s, vgroup:%d, buffer:%" PRId64 " cache:%" PRId64 " cacheLast:%" PRId64, pDb->name, pVgroup->vgId,
           buffer, cache, cacheLast);
  }

  // Only hand back the reference taken by this call, never the caller's.
  if (acquiredHere) {
    mndReleaseDb(pMnode, pDb);
  }
  return total;
}
1364

1365
// sdbTraverse callback over vgroups: for every replica of the visited vgroup
// located on the dnode whose id is stored behind p1, adds the vgroup's memory
// (mndGetVgroupMemory) to the int64_t accumulator behind p2. p3 is unused.
// Always returns true.
static bool mndGetVnodeMemroyFp(SMnode *pMnode, void *pObj, void *p1, void *p2, void *p3) {
  SVgObj  *pVg = pObj;
  int32_t  wantedDnode = *(int32_t *)p1;
  int64_t *pTotal = (int64_t *)p2;

  int32_t r = 0;
  while (r < pVg->replica) {
    if (pVg->vnodeGid[r].dnodeId == wantedDnode) {
      *pTotal += mndGetVgroupMemory(pMnode, NULL, pVg);
    }
    ++r;
  }

  return true;
}
1378

1379
// Sum the memory of all vnodes located on the given dnode by traversing every
// vgroup in the sdb.
int64_t mndGetVnodesMemory(SMnode *pMnode, int32_t dnodeId) {
  int64_t total = 0;
  SSdb   *pSdb = pMnode->pSdb;

  sdbTraverse(pSdb, SDB_VGROUP, mndGetVnodeMemroyFp, &dnodeId, &total, NULL);
  return total;
}
1384

1385
// Format the estimated time needed to apply `applyCount` entries at `rate`
// entries per millisecond as "hours:minutes:seconds" into restoreStr.
//
// rate           : apply rate; the quotient applyCount / rate is treated as
//                  milliseconds
// applyCount     : number of entries still to apply
// restoreStr     : output buffer; nothing is written when it is NULL
// restoreStrSize : size of restoreStr in bytes; nothing is written when 0
//
// "0:0:0" is written when no estimate can be made, i.e. when rate is zero,
// negative or NaN. An estimate that does not fit into int64_t is clamped to
// the int64_t range instead of being converted out of range.
void calculateRstoreFinishTime(double rate, int64_t applyCount, char *restoreStr, size_t restoreStrSize) {
  if (restoreStr == NULL || restoreStrSize == 0) {
    return;
  }

  // !(rate > 0) is also true for NaN, which a plain `rate == 0` test misses.
  if (!(rate > 0)) {
    snprintf(restoreStr, restoreStrSize, "0:0:0");
    return;
  }

  // Converting a double outside the int64_t range is undefined behavior, so
  // clamp before converting. 9223372036854775808.0 is exactly 2^63.
  double  costMs = (double)applyCount / rate;
  int64_t costTime = 0;
  if (costMs >= 9223372036854775808.0) {
    costTime = INT64_MAX;
  } else if (costMs < -9223372036854775808.0) {
    costTime = INT64_MIN;
  } else {
    costTime = (int64_t)costMs;
  }

  int64_t totalSeconds = costTime / 1000;
  int64_t hours = totalSeconds / 3600;
  totalSeconds %= 3600;
  int64_t minutes = totalSeconds / 60;
  int64_t seconds = totalSeconds % 60;
  snprintf(restoreStr, restoreStrSize, "%" PRId64 ":%" PRId64 ":%" PRId64, hours, minutes, seconds);
}
1399

1400
/*
 * Show-retrieve callback that emits one row per vnode replica.
 *
 * Iterates the SDB_VGROUP table through pShow->pIter and, for every replica of
 * every vgroup, fills the columns of pBlock in this order: dnode id, vgroup id,
 * db name, sync state, role time, start time, sync-restore flag, estimated
 * restore finish time, unapplied entry count, buffer segment used, buffer
 * segment size. Sync state, role time and start time are reported as
 * offline / 0 when the hosting dnode is not online.
 *
 * Fetching stops once fewer than TSDB_MAX_REPLICA row slots remain.
 *
 * Returns the number of rows written (also added to pShow->numOfRows), or the
 * error code of the failing colDataSetVal call. On the error path the vgroup
 * and dnode references held at that moment are released; the iterator in
 * pShow->pIter is left untouched for the caller to cancel.
 */
static int32_t mndRetrieveVnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode    *pMnode = pReq->info.node;
  SSdb      *pSdb = pMnode->pSdb;
  int32_t    numOfRows = 0;
  SVgObj    *pVgroup = NULL;
  SDnodeObj *pDnode = NULL;
  int32_t    cols = 0;
  int64_t    curMs = taosGetTimestampMs();
  int32_t    code = 0;

  while (numOfRows < rows - TSDB_MAX_REPLICA) {
    pShow->pIter = sdbFetch(pSdb, SDB_VGROUP, pShow->pIter, (void **)&pVgroup);
    if (pShow->pIter == NULL) break;

    for (int32_t i = 0; i < pVgroup->replica && numOfRows < rows; ++i) {
      SVnodeGid       *pGid = &pVgroup->vnodeGid[i];
      SColumnInfoData *pColInfo = NULL;
      cols = 0;
      pDnode = NULL;  // nothing acquired yet for this row

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->dnodeId, false);
      if (code != 0) {
        mError("vgId:%d, failed to set dnodeId, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pVgroup->vgId, false);
      if (code != 0) {
        mError("vgId:%d, failed to set vgId, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      // db_name
      const char *dbname = mndGetDbStr(pVgroup->dbName);
      char        b1[TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE] = {0};
      if (dbname != NULL) {
        STR_WITH_MAXSIZE_TO_VARSTR(b1, dbname, TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE);
      } else {
        STR_WITH_MAXSIZE_TO_VARSTR(b1, "NULL", TSDB_DB_NAME_LEN + VARSTR_HEADER_SIZE);
      }
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)b1, false);
      if (code != 0) {
        mError("vgId:%d, failed to set dbName, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      // dnode is online?
      pDnode = mndAcquireDnode(pMnode, pGid->dnodeId);
      if (pDnode == NULL) {
        mError("failed to acquire dnode. dnodeId:%d", pGid->dnodeId);
        // numOfRows is not advanced, so the partially filled row is reused by the next replica written
        break;
      }
      bool isDnodeOnline = mndIsDnodeOnline(pDnode, curMs);

      char       buf[20] = {0};
      ESyncState syncState = (isDnodeOnline) ? pGid->syncState : TAOS_SYNC_STATE_OFFLINE;
      STR_TO_VARSTR(buf, syncStr(syncState));
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)buf, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncState, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      int64_t roleTimeMs = (isDnodeOnline) ? pGid->roleTimeMs : 0;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&roleTimeMs, false);
      if (code != 0) {
        mError("vgId:%d, failed to set roleTimeMs, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      int64_t startTimeMs = (isDnodeOnline) ? pGid->startTimeMs : 0;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&startTimeMs, false);
      if (code != 0) {
        mError("vgId:%d, failed to set startTimeMs, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->syncRestore, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      int64_t unappliedCount = pGid->syncCommitIndex - pGid->syncAppliedIndex;
      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      char restoreStr[20] = {0};
      // dedicated buffer: up to 19 characters of restoreStr plus the varstr header do not fit in buf[20]
      char restoreBuf[sizeof(restoreStr) + VARSTR_HEADER_SIZE] = {0};
      if (unappliedCount > 0) {
        calculateRstoreFinishTime(pGid->appliedRate, unappliedCount, restoreStr, sizeof(restoreStr));
      }
      STR_TO_VARSTR(restoreBuf, restoreStr);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)restoreBuf, false);
      if (code != 0) {
        mError("vgId:%d, failed to set syncRestore finish time, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&unappliedCount, false);
      if (code != 0) {
        mError("vgId:%d, failed to set unapplied count, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->bufferSegmentUsed, false);
      if (code != 0) {
        mError("vgId:%d, failed to set buffer segment used, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
      code = colDataSetVal(pColInfo, numOfRows, (const char *)&pGid->bufferSegmentSize, false);
      if (code != 0) {
        mError("vgId:%d, failed to set buffer segment size, since %s", pVgroup->vgId, tstrerror(code));
        goto _ERR;
      }

      numOfRows++;
      sdbRelease(pSdb, pDnode);
      pDnode = NULL;
    }

    sdbRelease(pSdb, pVgroup);
  }

  pShow->numOfRows += numOfRows;
  return numOfRows;

_ERR:
  // drop the references still held for the row that failed
  if (pDnode != NULL) {
    sdbRelease(pSdb, pDnode);
  }
  if (pVgroup != NULL) {
    sdbRelease(pSdb, pVgroup);
  }
  return code;
}
1531

1532
/*
 * Cancels an in-progress SDB_VGROUP iteration identified by pIter.
 */
static void mndCancelGetNextVnode(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_VGROUP);
}
×
1536

1537
/*
 * Adds one replica to pVgroup on a dnode taken from pArray.
 *
 * pArray is sorted with mndCompareDnodeVnodes and scanned in that order; the
 * first dnode that does not already host a replica of the vgroup is the only
 * candidate considered. The call fails if that dnode has no free vnode slot
 * (TSDB_CODE_MND_NO_ENOUGH_VNODES) or not enough memory
 * (TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE). On success the new vnodeGid entry is
 * filled, the replica / numOfVnodes / memUsed counters are bumped, and the
 * encoded vgroup is appended to the transaction's group redo log with status
 * SDB_STATUS_READY.
 *
 * Returns TSDB_CODE_MND_NO_ENOUGH_DNODES when every dnode in pArray already
 * hosts a replica (or an array entry is NULL).
 */
static int32_t mndAddVnodeToVgroup(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray) {
  int32_t code = 0;
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
    mInfo("trans:%d, dnode:%d, equivalent vnodes:%d others:%d", pTrans->id, pDnode->id, pDnode->numOfVnodes,
          pDnode->numOfOtherNodes);
  }

  SVnodeGid *pVgid = &pVgroup->vnodeGid[pVgroup->replica];
  for (int32_t d = 0; d < taosArrayGetSize(pArray); ++d) {
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
    // must be checked before pDnode->id is read below
    if (pDnode == NULL) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_DNODES);
    }

    bool used = false;
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
      if (pDnode->id == pVgroup->vnodeGid[vn].dnodeId) {
        used = true;
        break;
      }
    }
    if (used) continue;

    if (pDnode->numOfVnodes >= pDnode->numOfSupportVnodes) {
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_VNODES);
    }

    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
    if (pDnode->memAvail - vgMem - pDnode->memUsed <= 0) {
      mError("trans:%d, db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
             pTrans->id, pVgroup->dbName, pVgroup->vgId, vgMem, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    } else {
      pDnode->memUsed += vgMem;
    }

    pVgid->dnodeId = pDnode->id;
    pVgid->syncState = TAOS_SYNC_STATE_OFFLINE;
    mInfo("trans:%d, db:%s, vgId:%d, vn:%d is added, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
          pTrans->id, pVgroup->dbName, pVgroup->vgId, pVgroup->replica, vgMem, pVgid->dnodeId, pDnode->memAvail,
          pDnode->memUsed);

    pVgroup->replica++;
    pDnode->numOfVnodes++;

    SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
    if (pVgRaw == NULL) {
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
      if (terrno != 0) code = terrno;
      TAOS_RETURN(code);
    }
    if ((code = mndTransAppendGroupRedolog(pTrans, pVgRaw, pVgroup->vgId)) != 0) {
      sdbFreeRaw(pVgRaw);
      TAOS_RETURN(code);
    }
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
    if (code != 0) {
      mError("trans:%d, vgId:%d, failed to set raw status since %s at line:%d", pTrans->id, pVgroup->vgId,
             tstrerror(code), __LINE__);
    }
    TAOS_RETURN(code);
  }

  code = TSDB_CODE_MND_NO_ENOUGH_DNODES;
  mError("trans:%d, db:%s, failed to add vnode to vgId:%d since %s", pTrans->id, pVgroup->dbName, pVgroup->vgId,
         tstrerror(code));
  TAOS_RETURN(code);
}
1607

1608
static int32_t mndRemoveVnodeFromVgroup(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray,
17,714✔
1609
                                        SVnodeGid *pDelVgid) {
1610
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
17,714✔
1611
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
77,903✔
1612
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
60,189✔
1613
    mInfo("trans:%d, dnode:%d, equivalent vnodes:%d others:%d", pTrans->id, pDnode->id, pDnode->numOfVnodes,
60,189✔
1614
          pDnode->numOfOtherNodes);
1615
  }
1616

1617
  int32_t code = -1;
17,714✔
1618
  for (int32_t d = taosArrayGetSize(pArray) - 1; d >= 0; --d) {
22,882✔
1619
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
22,818✔
1620

1621
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
43,800✔
1622
      SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
38,632✔
1623
      if (pVgid->dnodeId == pDnode->id) {
38,632✔
1624
        int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
17,650✔
1625
        pDnode->memUsed -= vgMem;
17,650✔
1626
        mInfo("trans:%d, db:%s, vgId:%d, vn:%d is removed, memory:%" PRId64 ", dnode:%d avail:%" PRId64
17,650✔
1627
              " used:%" PRId64,
1628
              pTrans->id, pVgroup->dbName, pVgroup->vgId, vn, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
1629
        pDnode->numOfVnodes--;
17,650✔
1630
        pVgroup->replica--;
17,650✔
1631
        *pDelVgid = *pVgid;
17,650✔
1632
        *pVgid = pVgroup->vnodeGid[pVgroup->replica];
17,650✔
1633
        memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));
17,650✔
1634
        code = 0;
17,650✔
1635
        goto _OVER;
17,650✔
1636
      }
1637
    }
1638
  }
1639

1640
_OVER:
64✔
1641
  if (code != 0) {
17,714✔
1642
    code = TSDB_CODE_APP_ERROR;
64✔
1643
    mError("trans:%d, db:%s, failed to remove vnode from vgId:%d since %s", pTrans->id, pVgroup->dbName, pVgroup->vgId,
64✔
1644
           tstrerror(code));
1645
    TAOS_RETURN(code);
64✔
1646
  }
1647

1648
  for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
48,009✔
1649
    SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
30,359✔
1650
    mInfo("trans:%d, db:%s, vgId:%d, vn:%d dnode:%d is reserved", pTrans->id, pVgroup->dbName, pVgroup->vgId, vn,
30,359✔
1651
          pVgid->dnodeId);
1652
  }
1653

1654
  SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
17,650✔
1655
  if (pVgRaw == NULL) {
17,650✔
1656
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
1657
    if (terrno != 0) code = terrno;
×
1658
    TAOS_RETURN(code);
×
1659
  }
1660
  if (mndTransAppendGroupRedolog(pTrans, pVgRaw, pVgroup->vgId) != 0) {
17,650✔
1661
    sdbFreeRaw(pVgRaw);
×
1662
    TAOS_RETURN(code);
×
1663
  }
1664
  code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
17,650✔
1665
  if (code != 0) {
17,650✔
1666
    mError("trans:%d, vgId:%d, failed to set raw status since %s at line:%d", pTrans->id, pVgroup->vgId,
×
1667
           tstrerror(code), __LINE__);
1668
  }
1669

1670
  TAOS_RETURN(code);
17,650✔
1671
}
1672

1673
static int32_t mndRemoveVnodeFromVgroupWithoutSave(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, SArray *pArray,
×
1674
                                                   SVnodeGid *pDelVgid) {
1675
  taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
×
1676
  for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
×
1677
    SDnodeObj *pDnode = taosArrayGet(pArray, i);
×
1678
    mInfo("dnode:%d, equivalent vnodes:%d others:%d", pDnode->id, pDnode->numOfVnodes, pDnode->numOfOtherNodes);
×
1679
  }
1680

1681
  int32_t code = -1;
×
1682
  for (int32_t d = taosArrayGetSize(pArray) - 1; d >= 0; --d) {
×
1683
    SDnodeObj *pDnode = taosArrayGet(pArray, d);
×
1684

1685
    for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
×
1686
      SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
×
1687
      if (pVgid->dnodeId == pDnode->id) {
×
1688
        int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
×
1689
        pDnode->memUsed -= vgMem;
×
1690
        mInfo("db:%s, vgId:%d, vn:%d is removed, memory:%" PRId64 ", dnode:%d avail:%" PRId64 " used:%" PRId64,
×
1691
              pVgroup->dbName, pVgroup->vgId, vn, vgMem, pVgid->dnodeId, pDnode->memAvail, pDnode->memUsed);
1692
        pDnode->numOfVnodes--;
×
1693
        pVgroup->replica--;
×
1694
        *pDelVgid = *pVgid;
×
1695
        *pVgid = pVgroup->vnodeGid[pVgroup->replica];
×
1696
        memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));
×
1697
        code = 0;
×
1698
        goto _OVER;
×
1699
      }
1700
    }
1701
  }
1702

1703
_OVER:
×
1704
  if (code != 0) {
×
1705
    code = TSDB_CODE_APP_ERROR;
×
1706
    mError("db:%s, failed to remove vnode from vgId:%d since %s", pVgroup->dbName, pVgroup->vgId, tstrerror(code));
×
1707
    TAOS_RETURN(code);
×
1708
  }
1709

1710
  for (int32_t vn = 0; vn < pVgroup->replica; ++vn) {
×
1711
    SVnodeGid *pVgid = &pVgroup->vnodeGid[vn];
×
1712
    mInfo("db:%s, vgId:%d, vn:%d dnode:%d is reserved", pVgroup->dbName, pVgroup->vgId, vn, pVgid->dnodeId);
×
1713
  }
1714

1715
  TAOS_RETURN(code);
×
1716
}
1717

1718
/*
 * Appends a TDMT_DND_CREATE_VNODE redo action for replica pVgid of pVgroup to
 * pTrans. The action is addressed to the dnode named by pVgid->dnodeId and
 * accepts TSDB_CODE_VND_ALREADY_EXIST as a successful outcome.
 *
 * The dnode reference is held until the request has been built, because
 * mndBuildCreateVnodeReq receives the dnode object.
 *
 * Returns 0 on success. When the dnode cannot be acquired or the request
 * cannot be built, returns terrno if set, else TSDB_CODE_MND_RETURN_VALUE_NULL.
 * Otherwise returns the error of mndTransAppendRedoAction (the request buffer
 * is freed in that case).
 */
int32_t mndAddCreateVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SVnodeGid *pVgid) {
  int32_t      code = 0;
  STransAction action = {0};

  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
  if (pDnode == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  action.epSet = mndGetDnodeEpset(pDnode);

  int32_t contLen = 0;
  void   *pReq = mndBuildCreateVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
  if (pReq == NULL) {
    // read terrno before the release call below has a chance to change it
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
  }
  mndReleaseDnode(pMnode, pDnode);
  if (pReq == NULL) {
    TAOS_RETURN(code);
  }

  action.pCont = pReq;
  action.contLen = contLen;
  action.msgType = TDMT_DND_CREATE_VNODE;
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
  action.groupId = pVgroup->vgId;

  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  TAOS_RETURN(code);
}
1744

1745
int32_t mndRestoreAddCreateVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
6,095✔
1746
                                       SDnodeObj *pDnode) {
1747
  int32_t      code = 0;
6,095✔
1748
  STransAction action = {0};
6,095✔
1749

1750
  action.epSet = mndGetDnodeEpset(pDnode);
6,095✔
1751

1752
  int32_t contLen = 0;
6,095✔
1753
  void   *pReq = mndBuildCreateVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
6,095✔
1754
  if (pReq == NULL) {
6,095✔
1755
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
1756
    if (terrno != 0) code = terrno;
×
1757
    TAOS_RETURN(code);
×
1758
  }
1759

1760
  action.pCont = pReq;
6,095✔
1761
  action.contLen = contLen;
6,095✔
1762
  action.msgType = TDMT_DND_CREATE_VNODE;
6,095✔
1763
  action.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
6,095✔
1764
  action.groupId = pVgroup->vgId;
6,095✔
1765

1766
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
6,095✔
1767
    taosMemoryFree(pReq);
×
1768
    TAOS_RETURN(code);
×
1769
  }
1770

1771
  TAOS_RETURN(code);
6,095✔
1772
}
1773

1774
/*
 * Appends a TDMT_VND_ALTER_CONFIRM redo action for pVgroup to pTrans. The
 * message consists of a bare SMsgHead (length and vgId in network byte order)
 * and is sent to the vgroup's endpoint set.
 *
 * Returns 0 on success, terrno if the header cannot be allocated, otherwise
 * the append error (the header is freed in that case).
 */
int32_t mndAddAlterVnodeConfirmAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  STransAction confirm = {0};
  confirm.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  mInfo("trans:%d, vgId:%d, build alter vnode confirm req", pTrans->id, pVgroup->vgId);

  int32_t   headLen = sizeof(SMsgHead);
  SMsgHead *pMsg = taosMemoryMalloc(headLen);
  if (pMsg == NULL) {
    TAOS_RETURN(terrno);
  }
  pMsg->vgId = htonl(pVgroup->vgId);
  pMsg->contLen = htonl(headLen);

  confirm.msgType = TDMT_VND_ALTER_CONFIRM;
  // an incorrect redirect result produces this error, so it is retried
  confirm.retryCode = TSDB_CODE_VND_INVALID_VGROUP_ID;
  confirm.groupId = pVgroup->vgId;
  confirm.pCont = pMsg;
  confirm.contLen = headLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &confirm);
  if (code != 0) {
    taosMemoryFree(pMsg);
  }
  TAOS_RETURN(code);
}
1803

1804
/*
 * Appends a TDMT_SYNC_CONFIG_CHANGE redo action to pTrans. The payload is an
 * SMsgHead (total length and vgId in network byte order) followed by the
 * alter-replica request built for pNewVgroup / dnodeId; it is addressed to the
 * endpoint set of pNewVgroup.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * request cannot be built; terrno if the combined buffer cannot be allocated;
 * otherwise the append error (the buffer is freed in that case).
 */
int32_t mndAddChangeConfigAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pOldVgroup, SVgObj *pNewVgroup,
                                 int32_t dnodeId) {
  STransAction change = {0};
  change.epSet = mndGetVgroupEpset(pMnode, pNewVgroup);

  int32_t bodyLen = 0;
  void   *pBody = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pNewVgroup, dnodeId, &bodyLen);
  if (pBody == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  int32_t   msgLen = bodyLen + sizeof(SMsgHead);
  SMsgHead *pMsg = taosMemoryMalloc(msgLen);
  if (pMsg == NULL) {
    taosMemoryFree(pBody);
    TAOS_RETURN(terrno);
  }

  pMsg->contLen = htonl(msgLen);
  pMsg->vgId = htonl(pNewVgroup->vgId);

  // the request body goes right after the header; the standalone copy is no longer needed
  memcpy((void *)(pMsg + 1), pBody, bodyLen);
  taosMemoryFree(pBody);

  change.msgType = TDMT_SYNC_CONFIG_CHANGE;
  change.pCont = pMsg;
  change.contLen = msgLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &change);
  if (code != 0) {
    taosMemoryFree(pMsg);
  }
  TAOS_RETURN(code);
}
1843

1844
/*
 * Appends a TDMT_VND_ALTER_HASHRANGE redo action to pTrans, built from srcVgId
 * and pVgroup and addressed to the endpoint set of pVgroup.
 * TSDB_CODE_VND_ALREADY_EXIST is accepted as success.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * request cannot be built; otherwise the append error (request freed).
 */
static int32_t mndAddAlterVnodeHashRangeAction(SMnode *pMnode, STrans *pTrans, int32_t srcVgId, SVgObj *pVgroup) {
  STransAction redo = {0};
  redo.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  int32_t reqLen = 0;
  void   *pCont = mndBuildAlterVnodeHashRangeReq(pMnode, srcVgId, pVgroup, &reqLen);
  if (pCont == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  redo.msgType = TDMT_VND_ALTER_HASHRANGE;
  redo.acceptableCode = TSDB_CODE_VND_ALREADY_EXIST;
  redo.pCont = pCont;
  redo.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &redo);
  if (code != 0) {
    taosMemoryFree(pCont);
    TAOS_RETURN(code);
  }

  // logged only once the action is part of the transaction
  mInfo("trans:%d, add alter vnode hash range action for from vgId:%d to vgId:%d", pTrans->id, srcVgId, pVgroup->vgId);
  TAOS_RETURN(code);
}
1870

1871
/*
 * Appends a TDMT_VND_ALTER_CONFIG redo action for pVgroup to pTrans,
 * addressed to the vgroup's endpoint set.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * request cannot be built; otherwise the append error (request freed).
 */
int32_t mndAddAlterVnodeConfigAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  STransAction redo = {0};
  redo.epSet = mndGetVgroupEpset(pMnode, pVgroup);

  int32_t reqLen = 0;
  void   *pCont = mndBuildAlterVnodeConfigReq(pMnode, pDb, pVgroup, &reqLen);
  if (pCont == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  redo.msgType = TDMT_VND_ALTER_CONFIG;
  redo.groupId = pVgroup->vgId;
  redo.pCont = pCont;
  redo.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &redo);
  if (code != 0) {
    taosMemoryFree(pCont);
  }
  TAOS_RETURN(code);
}
1896

1897
/*
 * Encodes pVg and appends it to the prepare log of pTrans with status
 * SDB_STATUS_CREATING.
 *
 * Returns 0 on success. If encoding fails, returns terrno (or
 * TSDB_CODE_MND_RETURN_VALUE_NULL when terrno is 0). If the append fails, its
 * error is returned and the raw is freed. If setting the status fails, that
 * error is logged and returned; the raw is not freed on that path, matching
 * how the other functions in this file treat a raw after a successful append
 * (presumably the transaction owns it from then on; confirm).
 */
int32_t mndAddNewVgPrepareAction(SMnode *pMnode, STrans *pTrans, SVgObj *pVg) {
  int32_t  code = 0;
  SSdbRaw *pRaw = mndVgroupActionEncode(pVg);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _err;
  }

  TAOS_CHECK_GOTO(mndTransAppendPrepareLog(pTrans, pRaw), NULL, _err);

  // keep the result: it used to be dropped, which made the error check below unreachable
  code = sdbSetRawStatus(pRaw, SDB_STATUS_CREATING);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVg->vgId, tstrerror(code), __LINE__);
  }
  TAOS_RETURN(code);

_err:
  sdbFreeRaw(pRaw);
  TAOS_RETURN(code);
}
1921

1922
/*
 * Appends a TDMT_VND_ALTER_REPLICA redo action for pVgroup to pTrans,
 * addressed to dnode `dnodeId`.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * dnode cannot be acquired or the request cannot be built; otherwise the
 * append error (request freed).
 */
int32_t mndAddAlterVnodeReplicaAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  // only the endpoint set is needed from the dnode object
  STransAction redo = {0};
  redo.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pCont = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pCont == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  redo.msgType = TDMT_VND_ALTER_REPLICA;
  redo.groupId = pVgroup->vgId;
  redo.pCont = pCont;
  redo.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &redo);
  if (code != 0) {
    taosMemoryFree(pCont);
  }
  TAOS_RETURN(code);
}
1955

1956
/*
 * Appends a TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP redo action for pVgroup to
 * pTrans, addressed to dnode `dnodeId`. TSDB_CODE_VND_ALREADY_IS_VOTER is
 * accepted as success and TSDB_CODE_VND_NOT_CATCH_UP is registered as the
 * retry code.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * dnode cannot be acquired or the request cannot be built; otherwise the
 * append error (request freed).
 */
int32_t mndAddCheckLearnerCatchupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  STransAction redo = {0};
  redo.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pCont = mndBuildCheckLearnCatchupReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pCont == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  redo.msgType = TDMT_DND_CHECK_VNODE_LEARNER_CATCHUP;
  redo.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
  redo.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
  redo.pCont = pCont;
  redo.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &redo);
  if (code != 0) {
    taosMemoryFree(pCont);
  }
  TAOS_RETURN(code);
}
1990

1991
/*
 * Appends a TDMT_DND_ALTER_VNODE_TYPE redo action for pVgroup to pTrans,
 * addressed to dnode `dnodeId`. The payload is the alter-replica request.
 * TSDB_CODE_VND_ALREADY_IS_VOTER is accepted as success and
 * TSDB_CODE_VND_NOT_CATCH_UP is registered as the retry code.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * dnode cannot be acquired or the request cannot be built; otherwise the
 * append error (request freed).
 */
int32_t mndAddAlterVnodeTypeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  STransAction redo = {0};
  redo.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pCont = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, dnodeId, &reqLen);
  if (pCont == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  redo.msgType = TDMT_DND_ALTER_VNODE_TYPE;
  redo.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
  redo.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
  redo.groupId = pVgroup->vgId;
  redo.pCont = pCont;
  redo.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &redo);
  if (code != 0) {
    taosMemoryFree(pCont);
  }
  TAOS_RETURN(code);
}
2026

2027
int32_t mndRestoreAddAlterVnodeTypeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
6,095✔
2028
                                          SDnodeObj *pDnode) {
2029
  int32_t      code = 0;
6,095✔
2030
  STransAction action = {0};
6,095✔
2031
  action.epSet = mndGetDnodeEpset(pDnode);
6,095✔
2032

2033
  int32_t contLen = 0;
6,095✔
2034
  void   *pReq = mndBuildAlterVnodeReplicaReq(pMnode, pDb, pVgroup, pDnode->id, &contLen);
6,095✔
2035
  if (pReq == NULL) {
6,095✔
2036
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2037
    if (terrno != 0) code = terrno;
×
2038
    TAOS_RETURN(code);
×
2039
  }
2040

2041
  action.pCont = pReq;
6,095✔
2042
  action.contLen = contLen;
6,095✔
2043
  action.msgType = TDMT_DND_ALTER_VNODE_TYPE;
6,095✔
2044
  action.acceptableCode = TSDB_CODE_VND_ALREADY_IS_VOTER;
6,095✔
2045
  action.retryCode = TSDB_CODE_VND_NOT_CATCH_UP;
6,095✔
2046
  action.groupId = pVgroup->vgId;
6,095✔
2047

2048
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
6,095✔
2049
    taosMemoryFree(pReq);
×
2050
    TAOS_RETURN(code);
×
2051
  }
2052

2053
  TAOS_RETURN(code);
6,095✔
2054
}
2055

2056
/*
 * Appends a TDMT_VND_DISABLE_WRITE redo action for pVgroup to pTrans,
 * addressed to dnode `dnodeId`.
 *
 * Returns 0 on success; terrno (or TSDB_CODE_MND_RETURN_VALUE_NULL) if the
 * dnode cannot be acquired or the request cannot be built; otherwise the
 * append error (request freed).
 */
static int32_t mndAddDisableVnodeWriteAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                             int32_t dnodeId) {
  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  STransAction redo = {0};
  redo.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pCont = mndBuildDisableVnodeWriteReq(pMnode, pDb, pVgroup->vgId, &reqLen);
  if (pCont == NULL) {
    int32_t err = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(err);
  }

  redo.msgType = TDMT_VND_DISABLE_WRITE;
  redo.pCont = pCont;
  redo.contLen = reqLen;

  int32_t code = mndTransAppendRedoAction(pTrans, &redo);
  if (code != 0) {
    taosMemoryFree(pCont);
  }
  TAOS_RETURN(code);
}
2089

2090
int32_t mndAddDropVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, SVnodeGid *pVgid,
4,465,971✔
2091
                              bool isRedo) {
2092
  int32_t      code = 0;
4,465,971✔
2093
  STransAction action = {0};
4,465,971✔
2094

2095
  SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgid->dnodeId);
4,465,971✔
2096
  if (pDnode == NULL) {
4,465,971✔
2097
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2098
    if (terrno != 0) code = terrno;
×
2099
    TAOS_RETURN(code);
×
2100
  }
2101
  action.epSet = mndGetDnodeEpset(pDnode);
4,465,971✔
2102
  mndReleaseDnode(pMnode, pDnode);
4,465,971✔
2103

2104
  int32_t contLen = 0;
4,465,971✔
2105
  void   *pReq = mndBuildDropVnodeReq(pMnode, pDnode, pDb, pVgroup, &contLen);
4,465,971✔
2106
  if (pReq == NULL) {
4,465,971✔
2107
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2108
    if (terrno != 0) code = terrno;
×
2109
    TAOS_RETURN(code);
×
2110
  }
2111

2112
  action.pCont = pReq;
4,465,971✔
2113
  action.contLen = contLen;
4,465,971✔
2114
  action.msgType = TDMT_DND_DROP_VNODE;
4,465,971✔
2115
  action.acceptableCode = TSDB_CODE_VND_NOT_EXIST;
4,465,971✔
2116
  action.groupId = pVgroup->vgId;
4,465,971✔
2117

2118
  if (isRedo) {
4,465,971✔
2119
    if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
1,626,069✔
2120
      taosMemoryFree(pReq);
×
2121
      TAOS_RETURN(code);
×
2122
    }
2123
  } else {
2124
    if ((code = mndTransAppendUndoAction(pTrans, &action)) != 0) {
2,839,902✔
2125
      taosMemoryFree(pReq);
×
2126
      TAOS_RETURN(code);
×
2127
    }
2128
  }
2129

2130
  TAOS_RETURN(code);
4,465,971✔
2131
}
2132

2133
int32_t mndSetMoveVgroupInfoToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t vnIndex,
16,826✔
2134
                                    SArray *pArray, bool force, bool unsafe) {
2135
  int32_t code = 0;
16,826✔
2136
  SVgObj  newVg = {0};
16,826✔
2137
  memcpy(&newVg, pVgroup, sizeof(SVgObj));
16,826✔
2138

2139
  mInfo("vgId:%d, trans:%d, vgroup info before move, replica:%d", newVg.vgId, pTrans->id, newVg.replica);
16,826✔
2140
  for (int32_t i = 0; i < newVg.replica; ++i) {
54,406✔
2141
    mInfo("vgId:%d, trans:%d, vnode:%d dnode:%d", newVg.vgId, pTrans->id, i, newVg.vnodeGid[i].dnodeId);
37,580✔
2142
  }
2143

2144
  if (!force) {
16,826✔
2145
#if 1
2146
    {
2147
#else
2148
    if (newVg.replica == 1) {
2149
#endif
2150
      mInfo("vgId:%d, trans:%d, will add 1 vnode, replca:%d", pVgroup->vgId, pTrans->id, newVg.replica);
16,826✔
2151
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray));
16,826✔
2152
      for (int32_t i = 0; i < newVg.replica - 1; ++i) {
54,406✔
2153
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
37,580✔
2154
      }
2155
      TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[newVg.replica - 1]));
16,826✔
2156
      TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
16,826✔
2157

2158
      mInfo("vgId:%d, trans:%d, will remove 1 vnode, replca:2", pVgroup->vgId, pTrans->id);
16,826✔
2159
      newVg.replica--;
16,826✔
2160
      SVnodeGid del = newVg.vnodeGid[vnIndex];
16,826✔
2161
      newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
16,826✔
2162
      memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
16,826✔
2163
      {
2164
        SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
16,826✔
2165
        if (pRaw == NULL) {
16,826✔
2166
          code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2167
          if (terrno != 0) code = terrno;
×
2168
          TAOS_RETURN(code);
×
2169
        }
2170
        if ((code = mndTransAppendGroupRedolog(pTrans, pRaw, pVgroup->vgId)) != 0) {
16,826✔
2171
          sdbFreeRaw(pRaw);
×
2172
          TAOS_RETURN(code);
×
2173
        }
2174
        code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
16,826✔
2175
        if (code != 0) {
16,826✔
2176
          mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2177
          return code;
×
2178
        }
2179
      }
2180

2181
      TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg, &del, true));
16,826✔
2182
      for (int32_t i = 0; i < newVg.replica; ++i) {
54,406✔
2183
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
37,580✔
2184
      }
2185
      TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
16,826✔
2186
#if 1
2187
    }
2188
#else
2189
    } else {  // new replica == 3
2190
      mInfo("vgId:%d, will add 1 vnode, replca:3", pVgroup->vgId);
2191
      if (mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray) != 0) return -1;
2192
      mInfo("vgId:%d, will remove 1 vnode, replca:4", pVgroup->vgId);
2193
      newVg.replica--;
2194
      SVnodeGid del = newVg.vnodeGid[vnIndex];
2195
      newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
2196
      memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
2197
      {
2198
        SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
2199
        if (pRaw == NULL) return -1;
2200
        if (mndTransAppendRedolog(pTrans, pRaw) != 0) {
2201
          sdbFreeRaw(pRaw);
2202
          return -1;
2203
        }
2204
      }
2205

2206
      if (mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg, &del, true) != 0) return -1;
2207
      for (int32_t i = 0; i < newVg.replica; ++i) {
2208
        if (i == vnIndex) continue;
2209
        if (mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId) != 0) return -1;
2210
      }
2211
      if (mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[vnIndex]) != 0) return -1;
2212
      if (mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg) != 0) return -1;
2213
    }
2214
#endif
2215
  } else {
2216
    mInfo("vgId:%d, will add 1 vnode and force remove 1 vnode", pVgroup->vgId);
×
2217
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVg, pArray));
×
2218
    newVg.replica--;
×
2219
    // SVnodeGid del = newVg.vnodeGid[vnIndex];
2220
    newVg.vnodeGid[vnIndex] = newVg.vnodeGid[newVg.replica];
×
2221
    memset(&newVg.vnodeGid[newVg.replica], 0, sizeof(SVnodeGid));
×
2222
    {
2223
      SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
×
2224
      if (pRaw == NULL) {
×
2225
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2226
        if (terrno != 0) code = terrno;
×
2227
        TAOS_RETURN(code);
×
2228
      }
2229
      if ((code = mndTransAppendGroupRedolog(pTrans, pRaw, pVgroup->vgId)) != 0) {
×
2230
        sdbFreeRaw(pRaw);
×
2231
        TAOS_RETURN(code);
×
2232
      }
2233
      code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
×
2234
      if (code != 0) {
×
2235
        mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2236
        return code;
×
2237
      }
2238
    }
2239

2240
    for (int32_t i = 0; i < newVg.replica; ++i) {
×
2241
      if (i != vnIndex) {
×
2242
        TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg, newVg.vnodeGid[i].dnodeId));
×
2243
      }
2244
    }
2245
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg, &newVg.vnodeGid[vnIndex]));
×
2246
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg));
×
2247

2248
    if (newVg.replica == 1) {
×
2249
      if (force && !unsafe) {
×
2250
        TAOS_RETURN(TSDB_CODE_VND_META_DATA_UNSAFE_DELETE);
×
2251
      }
2252

2253
      SSdb *pSdb = pMnode->pSdb;
×
2254
      void *pIter = NULL;
×
2255

2256
      while (1) {
×
2257
        SStbObj *pStb = NULL;
×
2258
        pIter = sdbFetch(pSdb, SDB_STB, pIter, (void **)&pStb);
×
2259
        if (pIter == NULL) break;
×
2260

2261
        if (strcmp(pStb->db, pDb->name) == 0) {
×
2262
          if ((code = mndSetForceDropCreateStbRedoActions(pMnode, pTrans, &newVg, pStb)) != 0) {
×
2263
            sdbCancelFetch(pSdb, pIter);
×
2264
            sdbRelease(pSdb, pStb);
×
2265
            TAOS_RETURN(code);
×
2266
          }
2267
        }
2268

2269
        sdbRelease(pSdb, pStb);
×
2270
      }
2271

2272
      mInfo("vgId:%d, all data is dropped since replica=1", pVgroup->vgId);
×
2273
    }
2274
  }
2275

2276
  {
2277
    SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
16,826✔
2278
    if (pRaw == NULL) {
16,826✔
2279
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2280
      if (terrno != 0) code = terrno;
×
2281
      TAOS_RETURN(code);
×
2282
    }
2283
    if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
16,826✔
2284
      sdbFreeRaw(pRaw);
×
2285
      TAOS_RETURN(code);
×
2286
    }
2287
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
16,826✔
2288
    if (code != 0) {
16,826✔
2289
      mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2290
      return code;
×
2291
    }
2292
  }
2293

2294
  mInfo("vgId:%d, vgroup info after move, replica:%d", newVg.vgId, newVg.replica);
16,826✔
2295
  for (int32_t i = 0; i < newVg.replica; ++i) {
54,406✔
2296
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
37,580✔
2297
  }
2298
  TAOS_RETURN(code);
16,826✔
2299
}
2300

2301
/*
 * For every vgroup that has a vnode on dnode delDnodeId, add the steps that
 * move that vnode elsewhere to pTrans.
 *
 * pMnode      mnode context
 * pTrans      transaction receiving the move steps
 * delDnodeId  dnode whose vnodes must be moved away
 * force       passed through to mndSetMoveVgroupInfoToTrans
 * unsafe      passed through to mndSetMoveVgroupInfoToTrans
 *
 * Returns 0 when all affected vgroups were handled, otherwise the first error
 * (iteration stops at the first failure).
 */
int32_t mndSetMoveVgroupsInfoToTrans(SMnode *pMnode, STrans *pTrans, int32_t delDnodeId, bool force, bool unsafe) {
  int32_t code = 0;
  SArray *pArray = mndBuildDnodesArray(pMnode, delDnodeId, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  void *pIter = NULL;
  while (1) {
    SVgObj *pVgroup = NULL;
    pIter = sdbFetch(pMnode->pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
    if (pIter == NULL) break;

    // Locate the vnode of this vgroup that sits on the dnode being removed.
    int32_t vnIndex = -1;
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
      if (pVgroup->vnodeGid[i].dnodeId == delDnodeId) {
        vnIndex = i;
        break;
      }
    }

    code = 0;
    if (vnIndex != -1) {
      mInfo("vgId:%d, trans:%d, vnode:%d will be removed from dnode:%d, force:%d", pVgroup->vgId, pTrans->id, vnIndex,
            delDnodeId, force);
      SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
      if (pDb == NULL) {
        // The db could not be acquired; fail instead of handing a NULL db to
        // the move logic, which dereferences it.
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
        if (terrno != 0) code = terrno;
        mError("vgId:%d, failed to acquire db:%s since %s", pVgroup->vgId, pVgroup->dbName, tstrerror(code));
      } else {
        code = mndSetMoveVgroupInfoToTrans(pMnode, pTrans, pDb, pVgroup, vnIndex, pArray, force, unsafe);
        mndReleaseDb(pMnode, pDb);
      }
    }

    sdbRelease(pMnode->pSdb, pVgroup);

    if (code != 0) {
      // Leaving the loop early: the open iterator must be cancelled.
      sdbCancelFetch(pMnode->pSdb, pIter);
      break;
    }
  }

  taosArrayDestroy(pArray);
  TAOS_RETURN(code);
}
2344

2345
/*
 * Grow pVgroup by one vnode on dnode newDnodeId and add the matching steps to
 * pTrans: a redo log with the enlarged vgroup, alter-replica actions for the
 * previously existing vnodes, creation of the new vnode as learner, its
 * promotion to voter, and a final confirm action.
 *
 * pVgroup is modified in place (replica is incremented and the new slot is
 * filled). Returns 0 on success or the first error code.
 */
static int32_t mndAddIncVgroupReplicaToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                             int32_t newDnodeId) {
  int32_t code = 0;
  int32_t idx = 0;
  mInfo("vgId:%d, will add 1 vnode, replica:%d dnode:%d", pVgroup->vgId, pVgroup->replica, newDnodeId);

  // Fill the first free slot, then count it.
  SVnodeGid *pAdded = &pVgroup->vnodeGid[pVgroup->replica];
  pVgroup->replica++;
  pAdded->dnodeId = newDnodeId;
  pAdded->syncState = TAOS_SYNC_STATE_OFFLINE;
  pAdded->nodeRole = TAOS_SYNC_ROLE_LEARNER;

  SSdbRaw *pRaw = mndVgroupActionEncode(pVgroup);
  if (pRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }
  code = mndTransAppendRedolog(pTrans, pRaw);
  if (code != 0) {
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }
  code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  // Learner phase: tell the existing vnodes about the new member, then create it.
  idx = 0;
  while (idx < pVgroup->replica - 1) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[idx].dnodeId));
    ++idx;
  }
  TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pDb, pVgroup, pAdded));

  // Voter phase: switch the new member's role and notify the existing vnodes again.
  pAdded->nodeRole = TAOS_SYNC_ROLE_VOTER;
  TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pDb, pVgroup, pAdded->dnodeId));
  idx = 0;
  while (idx < pVgroup->replica - 1) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[idx].dnodeId));
    ++idx;
  }

  // Final confirmation step.
  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, pVgroup));

  TAOS_RETURN(code);
}
2391

2392
/*
 * Shrink pVgroup by removing the vnode located on dnode delDnodeId and add the
 * matching steps to pTrans: a redo log with the reduced vgroup, a drop action
 * for the removed vnode, alter-replica actions for the remaining vnodes and a
 * confirm action.
 *
 * pVgroup is modified in place: the last vnode entry is moved into the slot of
 * the removed one and the tail slot is zeroed. If no vnode of the vgroup lives
 * on delDnodeId the function does nothing and returns 0.
 *
 * Returns 0 on success or the first error code.
 */
static int32_t mndAddDecVgroupReplicaFromTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                               int32_t delDnodeId) {
  int32_t code = 0;
  mInfo("vgId:%d, will remove 1 vnode, replica:%d dnode:%d", pVgroup->vgId, pVgroup->replica, delDnodeId);

  SVnodeGid *pGid = NULL;
  SVnodeGid  delGid = {0};
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    if (pVgroup->vnodeGid[i].dnodeId == delDnodeId) {
      pGid = &pVgroup->vnodeGid[i];
      break;
    }
  }

  if (pGid == NULL) return 0;

  pVgroup->replica--;
  // Struct assignment instead of memcpy: when the removed vnode is the last
  // entry, source and destination are the same object, which memcpy does not
  // permit but assignment with exact overlap does.
  delGid = *pGid;
  *pGid = pVgroup->vnodeGid[pVgroup->replica];
  memset(&pVgroup->vnodeGid[pVgroup->replica], 0, sizeof(SVnodeGid));

  SSdbRaw *pVgRaw = mndVgroupActionEncode(pVgroup);
  if (pVgRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }
  if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
    sdbFreeRaw(pVgRaw);
    TAOS_RETURN(code);
  }
  code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status since %s at line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  // Drop the removed vnode, then update and confirm the remaining ones.
  TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pDb, pVgroup, &delGid, true));
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    TAOS_CHECK_RETURN(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, pVgroup, pVgroup->vnodeGid[i].dnodeId));
  }
  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, pVgroup));

  TAOS_RETURN(code);
}
2437

2438
static int32_t mndRedistributeVgroup(SMnode *pMnode, SRpcMsg *pReq, SDbObj *pDb, SVgObj *pVgroup, SDnodeObj *pNew1,
37,944✔
2439
                                     SDnodeObj *pOld1, SDnodeObj *pNew2, SDnodeObj *pOld2, SDnodeObj *pNew3,
2440
                                     SDnodeObj *pOld3) {
2441
  int32_t code = -1;
37,944✔
2442
  STrans *pTrans = NULL;
37,944✔
2443

2444
  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "red-vgroup");
37,944✔
2445
  if (pTrans == NULL) {
37,944✔
2446
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2447
    if (terrno != 0) code = terrno;
×
2448
    goto _OVER;
×
2449
  }
2450

2451
  mndTransSetDbName(pTrans, pVgroup->dbName, NULL);
37,944✔
2452
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);
37,944✔
2453
  TAOS_CHECK_GOTO(mndTransCheckConflictWithRetention(pMnode, pTrans), NULL, _OVER);
37,674✔
2454

2455
  mndTransSetSerial(pTrans);
37,674✔
2456
  mInfo("trans:%d, used to redistribute vgroup, vgId:%d", pTrans->id, pVgroup->vgId);
37,674✔
2457

2458
  SVgObj newVg = {0};
37,674✔
2459
  memcpy(&newVg, pVgroup, sizeof(SVgObj));
37,674✔
2460
  mInfo("vgId:%d, vgroup info before redistribute, replica:%d", newVg.vgId, newVg.replica);
37,674✔
2461
  for (int32_t i = 0; i < newVg.replica; ++i) {
124,912✔
2462
    mInfo("vgId:%d, vnode:%d dnode:%d role:%s", newVg.vgId, i, newVg.vnodeGid[i].dnodeId,
87,238✔
2463
          syncStr(newVg.vnodeGid[i].syncState));
2464
  }
2465

2466
  if (pNew1 != NULL && pOld1 != NULL) {
37,674✔
2467
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew1->id);
37,674✔
2468
    if (numOfVnodes >= pNew1->numOfSupportVnodes) {
37,674✔
2469
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew1->id, numOfVnodes,
711✔
2470
             pNew1->numOfSupportVnodes);
2471
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
711✔
2472
      goto _OVER;
711✔
2473
    }
2474

2475
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
36,963✔
2476
    if (pNew1->memAvail - vgMem - pNew1->memUsed <= 0) {
36,963✔
2477
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2478
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew1->id, pNew1->memAvail, pNew1->memUsed);
2479
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2480
      goto _OVER;
×
2481
    } else {
2482
      pNew1->memUsed += vgMem;
36,963✔
2483
    }
2484

2485
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew1->id), NULL, _OVER);
36,963✔
2486
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld1->id), NULL, _OVER);
36,963✔
2487
  }
2488

2489
  if (pNew2 != NULL && pOld2 != NULL) {
36,963✔
2490
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew2->id);
9,839✔
2491
    if (numOfVnodes >= pNew2->numOfSupportVnodes) {
9,839✔
2492
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew2->id, numOfVnodes,
×
2493
             pNew2->numOfSupportVnodes);
2494
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
×
2495
      goto _OVER;
×
2496
    }
2497
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
9,839✔
2498
    if (pNew2->memAvail - vgMem - pNew2->memUsed <= 0) {
9,839✔
2499
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2500
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew2->id, pNew2->memAvail, pNew2->memUsed);
2501
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2502
      goto _OVER;
×
2503
    } else {
2504
      pNew2->memUsed += vgMem;
9,839✔
2505
    }
2506
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew2->id), NULL, _OVER);
9,839✔
2507
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld2->id), NULL, _OVER);
9,839✔
2508
  }
2509

2510
  if (pNew3 != NULL && pOld3 != NULL) {
36,963✔
2511
    int32_t numOfVnodes = mndGetVnodesNum(pMnode, pNew3->id);
2,857✔
2512
    if (numOfVnodes >= pNew3->numOfSupportVnodes) {
2,857✔
2513
      mError("vgId:%d, no enough vnodes in dnode:%d, numOfVnodes:%d support:%d", newVg.vgId, pNew3->id, numOfVnodes,
×
2514
             pNew3->numOfSupportVnodes);
2515
      code = TSDB_CODE_MND_NO_ENOUGH_VNODES;
×
2516
      goto _OVER;
×
2517
    }
2518
    int64_t vgMem = mndGetVgroupMemory(pMnode, NULL, pVgroup);
2,857✔
2519
    if (pNew3->memAvail - vgMem - pNew3->memUsed <= 0) {
2,857✔
2520
      mError("db:%s, vgId:%d, no enough memory:%" PRId64 " in dnode:%d avail:%" PRId64 " used:%" PRId64,
×
2521
             pVgroup->dbName, pVgroup->vgId, vgMem, pNew3->id, pNew3->memAvail, pNew3->memUsed);
2522
      code = TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE;
×
2523
      goto _OVER;
×
2524
    } else {
2525
      pNew3->memUsed += vgMem;
2,857✔
2526
    }
2527
    TAOS_CHECK_GOTO(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &newVg, pNew3->id), NULL, _OVER);
2,857✔
2528
    TAOS_CHECK_GOTO(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &newVg, pOld3->id), NULL, _OVER);
2,857✔
2529
  }
2530

2531
  {
2532
    SSdbRaw *pRaw = mndVgroupActionEncode(&newVg);
36,963✔
2533
    if (pRaw == NULL) {
36,963✔
2534
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2535
      if (terrno != 0) code = terrno;
×
2536
      goto _OVER;
×
2537
    }
2538
    if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
36,963✔
2539
      sdbFreeRaw(pRaw);
×
2540
      goto _OVER;
×
2541
    }
2542
    code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
36,963✔
2543
    if (code != 0) {
36,963✔
2544
      mError("vgId:%d, failed to set raw status since %s at line:%d", newVg.vgId, tstrerror(code), __LINE__);
×
2545
      goto _OVER;
×
2546
    }
2547
  }
2548

2549
  mInfo("vgId:%d, vgroup info after redistribute, replica:%d", newVg.vgId, newVg.replica);
36,963✔
2550
  for (int32_t i = 0; i < newVg.replica; ++i) {
122,068✔
2551
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg.vgId, i, newVg.vnodeGid[i].dnodeId);
85,105✔
2552
  }
2553

2554
  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);
36,963✔
2555
  code = 0;
34,246✔
2556

2557
_OVER:
37,944✔
2558
  mndTransDrop(pTrans);
37,944✔
2559
  mndReleaseDb(pMnode, pDb);
37,944✔
2560
  TAOS_RETURN(code);
37,944✔
2561
}
2562

2563
static int32_t mndProcessRedistributeVgroupMsg(SRpcMsg *pReq) {
45,811✔
2564
  SMnode    *pMnode = pReq->info.node;
45,811✔
2565
  SDnodeObj *pNew1 = NULL;
45,811✔
2566
  SDnodeObj *pNew2 = NULL;
45,811✔
2567
  SDnodeObj *pNew3 = NULL;
45,811✔
2568
  SDnodeObj *pOld1 = NULL;
45,811✔
2569
  SDnodeObj *pOld2 = NULL;
45,811✔
2570
  SDnodeObj *pOld3 = NULL;
45,811✔
2571
  SVgObj    *pVgroup = NULL;
45,811✔
2572
  SDbObj    *pDb = NULL;
45,811✔
2573
  int32_t    code = -1;
45,811✔
2574
  int64_t    curMs = taosGetTimestampMs();
45,811✔
2575
  int32_t    newDnodeId[3] = {0};
45,811✔
2576
  int32_t    oldDnodeId[3] = {0};
45,811✔
2577
  int32_t    newIndex = -1;
45,811✔
2578
  int32_t    oldIndex = -1;
45,811✔
2579

2580
  SRedistributeVgroupReq req = {0};
45,811✔
2581
  if (tDeserializeSRedistributeVgroupReq(pReq->pCont, pReq->contLen, &req) != 0) {
45,811✔
2582
    code = TSDB_CODE_INVALID_MSG;
×
2583
    goto _OVER;
×
2584
  }
2585

2586
  mInfo("vgId:%d, start to redistribute vgroup to dnode %d:%d:%d", req.vgId, req.dnodeId1, req.dnodeId2, req.dnodeId3);
45,811✔
2587
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_REDISTRIBUTE_VGROUP)) != 0) {
45,811✔
2588
    goto _OVER;
349✔
2589
  }
2590

2591
  pVgroup = mndAcquireVgroup(pMnode, req.vgId);
45,462✔
2592
  if (pVgroup == NULL) {
45,462✔
2593
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
2,133✔
2594
    if (terrno != 0) code = terrno;
2,133✔
2595
    goto _OVER;
2,133✔
2596
  }
2597
  if (pVgroup->mountVgId) {
43,329✔
2598
    code = TSDB_CODE_MND_MOUNT_OBJ_NOT_SUPPORT;
×
2599
    goto _OVER;
×
2600
  }
2601
  pDb = mndAcquireDb(pMnode, pVgroup->dbName);
43,329✔
2602
  if (pDb == NULL) {
43,329✔
2603
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2604
    if (terrno != 0) code = terrno;
×
2605
    goto _OVER;
×
2606
  }
2607

2608
  if (pVgroup->replica == 1) {
43,329✔
2609
    if (req.dnodeId1 <= 0 || req.dnodeId2 > 0 || req.dnodeId3 > 0) {
12,480✔
2610
      code = TSDB_CODE_MND_INVALID_REPLICA;
×
2611
      goto _OVER;
×
2612
    }
2613

2614
    if (req.dnodeId1 == pVgroup->vnodeGid[0].dnodeId) {
12,480✔
2615
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2616
      code = 0;
×
2617
      goto _OVER;
×
2618
    }
2619

2620
    pNew1 = mndAcquireDnode(pMnode, req.dnodeId1);
12,480✔
2621
    if (pNew1 == NULL) {
12,480✔
2622
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2623
      if (terrno != 0) code = terrno;
×
2624
      goto _OVER;
×
2625
    }
2626
    if (!mndIsDnodeOnline(pNew1, curMs)) {
12,480✔
2627
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2628
      goto _OVER;
×
2629
    }
2630

2631
    pOld1 = mndAcquireDnode(pMnode, pVgroup->vnodeGid[0].dnodeId);
12,480✔
2632
    if (pOld1 == NULL) {
12,480✔
2633
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2634
      if (terrno != 0) code = terrno;
×
2635
      goto _OVER;
×
2636
    }
2637
    if (!mndIsDnodeOnline(pOld1, curMs)) {
12,480✔
2638
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
41✔
2639
      goto _OVER;
41✔
2640
    }
2641

2642
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, NULL, NULL, NULL, NULL);
12,439✔
2643

2644
  } else if (pVgroup->replica == 3) {
30,849✔
2645
    if (req.dnodeId1 <= 0 || req.dnodeId2 <= 0 || req.dnodeId3 <= 0) {
29,403✔
2646
      code = TSDB_CODE_MND_INVALID_REPLICA;
2,844✔
2647
      goto _OVER;
2,844✔
2648
    }
2649

2650
    if (req.dnodeId1 == req.dnodeId2 || req.dnodeId1 == req.dnodeId3 || req.dnodeId2 == req.dnodeId3) {
26,559✔
2651
      code = TSDB_CODE_MND_INVALID_REPLICA;
711✔
2652
      goto _OVER;
711✔
2653
    }
2654

2655
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId &&
25,848✔
2656
        req.dnodeId1 != pVgroup->vnodeGid[2].dnodeId) {
10,657✔
2657
      newDnodeId[++newIndex] = req.dnodeId1;
9,235✔
2658
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
9,235✔
2659
    }
2660

2661
    if (req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId &&
25,848✔
2662
        req.dnodeId2 != pVgroup->vnodeGid[2].dnodeId) {
16,231✔
2663
      newDnodeId[++newIndex] = req.dnodeId2;
11,265✔
2664
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
11,265✔
2665
    }
2666

2667
    if (req.dnodeId3 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId3 != pVgroup->vnodeGid[1].dnodeId &&
25,848✔
2668
        req.dnodeId3 != pVgroup->vnodeGid[2].dnodeId) {
20,171✔
2669
      newDnodeId[++newIndex] = req.dnodeId3;
15,547✔
2670
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
15,547✔
2671
    }
2672

2673
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId &&
25,848✔
2674
        req.dnodeId3 != pVgroup->vnodeGid[0].dnodeId) {
15,596✔
2675
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[0].dnodeId;
12,041✔
2676
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
12,041✔
2677
    }
2678

2679
    if (req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId &&
25,848✔
2680
        req.dnodeId3 != pVgroup->vnodeGid[1].dnodeId) {
11,292✔
2681
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[1].dnodeId;
9,170✔
2682
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
9,170✔
2683
    }
2684

2685
    if (req.dnodeId1 != pVgroup->vnodeGid[2].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[2].dnodeId &&
25,848✔
2686
        req.dnodeId3 != pVgroup->vnodeGid[2].dnodeId) {
19,460✔
2687
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[2].dnodeId;
14,836✔
2688
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
14,836✔
2689
    }
2690

2691
    if (newDnodeId[0] != 0) {
25,848✔
2692
      pNew1 = mndAcquireDnode(pMnode, newDnodeId[0]);
24,779✔
2693
      if (pNew1 == NULL) {
24,779✔
2694
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2695
        if (terrno != 0) code = terrno;
×
2696
        goto _OVER;
×
2697
      }
2698
      if (!mndIsDnodeOnline(pNew1, curMs)) {
24,779✔
2699
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
720✔
2700
        goto _OVER;
720✔
2701
      }
2702
    }
2703

2704
    if (newDnodeId[1] != 0) {
25,128✔
2705
      pNew2 = mndAcquireDnode(pMnode, newDnodeId[1]);
8,393✔
2706
      if (pNew2 == NULL) {
8,393✔
2707
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2708
        if (terrno != 0) code = terrno;
×
2709
        goto _OVER;
×
2710
      }
2711
      if (!mndIsDnodeOnline(pNew2, curMs)) {
8,393✔
2712
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2713
        goto _OVER;
×
2714
      }
2715
    }
2716

2717
    if (newDnodeId[2] != 0) {
25,128✔
2718
      pNew3 = mndAcquireDnode(pMnode, newDnodeId[2]);
2,857✔
2719
      if (pNew3 == NULL) {
2,857✔
2720
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2721
        if (terrno != 0) code = terrno;
×
2722
        goto _OVER;
×
2723
      }
2724
      if (!mndIsDnodeOnline(pNew3, curMs)) {
2,857✔
2725
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2726
        goto _OVER;
×
2727
      }
2728
    }
2729

2730
    if (oldDnodeId[0] != 0) {
25,128✔
2731
      pOld1 = mndAcquireDnode(pMnode, oldDnodeId[0]);
24,059✔
2732
      if (pOld1 == NULL) {
24,059✔
2733
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2734
        if (terrno != 0) code = terrno;
×
2735
        goto _OVER;
×
2736
      }
2737
      if (!mndIsDnodeOnline(pOld1, curMs)) {
24,059✔
UNCOV
2738
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
UNCOV
2739
        goto _OVER;
×
2740
      }
2741
    }
2742

2743
    if (oldDnodeId[1] != 0) {
25,128✔
2744
      pOld2 = mndAcquireDnode(pMnode, oldDnodeId[1]);
8,393✔
2745
      if (pOld2 == NULL) {
8,393✔
2746
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2747
        if (terrno != 0) code = terrno;
×
2748
        goto _OVER;
×
2749
      }
2750
      if (!mndIsDnodeOnline(pOld2, curMs)) {
8,393✔
2751
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2752
        goto _OVER;
×
2753
      }
2754
    }
2755

2756
    if (oldDnodeId[2] != 0) {
25,128✔
2757
      pOld3 = mndAcquireDnode(pMnode, oldDnodeId[2]);
2,857✔
2758
      if (pOld3 == NULL) {
2,857✔
2759
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2760
        if (terrno != 0) code = terrno;
×
2761
        goto _OVER;
×
2762
      }
2763
      if (!mndIsDnodeOnline(pOld3, curMs)) {
2,857✔
2764
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2765
        goto _OVER;
×
2766
      }
2767
    }
2768

2769
    if (pNew1 == NULL && pOld1 == NULL && pNew2 == NULL && pOld2 == NULL && pNew3 == NULL && pOld3 == NULL) {
25,128✔
2770
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2771
      code = 0;
1,069✔
2772
      goto _OVER;
1,069✔
2773
    }
2774

2775
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, pNew2, pOld2, pNew3, pOld3);
24,059✔
2776

2777
  } else if (pVgroup->replica == 2) {
1,446✔
2778
    if (req.dnodeId1 <= 0 || req.dnodeId2 <= 0) {
1,446✔
2779
      code = TSDB_CODE_MND_INVALID_REPLICA;
×
2780
      goto _OVER;
×
2781
    }
2782

2783
    if (req.dnodeId1 == req.dnodeId2) {
1,446✔
2784
      code = TSDB_CODE_MND_INVALID_REPLICA;
×
2785
      goto _OVER;
×
2786
    }
2787

2788
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId) {
1,446✔
2789
      newDnodeId[++newIndex] = req.dnodeId1;
1,446✔
2790
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
1,446✔
2791
    }
2792

2793
    if (req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId) {
1,446✔
2794
      newDnodeId[++newIndex] = req.dnodeId2;
1,446✔
2795
      mInfo("vgId:%d, dnode:%d will be added, index:%d", pVgroup->vgId, newDnodeId[newIndex], newIndex);
1,446✔
2796
    }
2797

2798
    if (req.dnodeId1 != pVgroup->vnodeGid[0].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[0].dnodeId) {
1,446✔
2799
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[0].dnodeId;
1,446✔
2800
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
1,446✔
2801
    }
2802

2803
    if (req.dnodeId1 != pVgroup->vnodeGid[1].dnodeId && req.dnodeId2 != pVgroup->vnodeGid[1].dnodeId) {
1,446✔
2804
      oldDnodeId[++oldIndex] = pVgroup->vnodeGid[1].dnodeId;
1,446✔
2805
      mInfo("vgId:%d, dnode:%d will be removed, index:%d", pVgroup->vgId, oldDnodeId[oldIndex], oldIndex);
1,446✔
2806
    }
2807

2808
    if (newDnodeId[0] != 0) {
1,446✔
2809
      pNew1 = mndAcquireDnode(pMnode, newDnodeId[0]);
1,446✔
2810
      if (pNew1 == NULL) {
1,446✔
2811
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2812
        if (terrno != 0) code = terrno;
×
2813
        goto _OVER;
×
2814
      }
2815
      if (!mndIsDnodeOnline(pNew1, curMs)) {
1,446✔
2816
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2817
        goto _OVER;
×
2818
      }
2819
    }
2820

2821
    if (newDnodeId[1] != 0) {
1,446✔
2822
      pNew2 = mndAcquireDnode(pMnode, newDnodeId[1]);
1,446✔
2823
      if (pNew2 == NULL) {
1,446✔
2824
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2825
        if (terrno != 0) code = terrno;
×
2826
        goto _OVER;
×
2827
      }
2828
      if (!mndIsDnodeOnline(pNew2, curMs)) {
1,446✔
2829
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2830
        goto _OVER;
×
2831
      }
2832
    }
2833

2834
    if (oldDnodeId[0] != 0) {
1,446✔
2835
      pOld1 = mndAcquireDnode(pMnode, oldDnodeId[0]);
1,446✔
2836
      if (pOld1 == NULL) {
1,446✔
2837
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2838
        if (terrno != 0) code = terrno;
×
2839
        goto _OVER;
×
2840
      }
2841
      if (!mndIsDnodeOnline(pOld1, curMs)) {
1,446✔
2842
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2843
        goto _OVER;
×
2844
      }
2845
    }
2846

2847
    if (oldDnodeId[1] != 0) {
1,446✔
2848
      pOld2 = mndAcquireDnode(pMnode, oldDnodeId[1]);
1,446✔
2849
      if (pOld2 == NULL) {
1,446✔
2850
        code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
2851
        if (terrno != 0) code = terrno;
×
2852
        goto _OVER;
×
2853
      }
2854
      if (!mndIsDnodeOnline(pOld2, curMs)) {
1,446✔
2855
        code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
×
2856
        goto _OVER;
×
2857
      }
2858
    }
2859

2860
    if (pNew1 == NULL && pOld1 == NULL && pNew2 == NULL && pOld2 == NULL) {
1,446✔
2861
      // terrno = TSDB_CODE_MND_VGROUP_UN_CHANGED;
2862
      code = 0;
×
2863
      goto _OVER;
×
2864
    }
2865

2866
    code = mndRedistributeVgroup(pMnode, pReq, pDb, pVgroup, pNew1, pOld1, pNew2, pOld2, NULL, NULL);
1,446✔
2867
  } else {
2868
    code = TSDB_CODE_MND_REQ_REJECTED;
×
2869
    goto _OVER;
×
2870
  }
2871

2872
  if (code == 0) code = TSDB_CODE_ACTION_IN_PROGRESS;
37,944✔
2873

2874
  char obj[33] = {0};
37,944✔
2875
  (void)tsnprintf(obj, sizeof(obj), "%d", req.vgId);
37,944✔
2876

2877
  auditRecord(pReq, pMnode->clusterId, "RedistributeVgroup", "", obj, req.sql, req.sqlLen);
37,944✔
2878

2879
_OVER:
45,811✔
2880
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
45,811✔
2881
    mError("vgId:%d, failed to redistribute to dnode %d:%d:%d since %s", req.vgId, req.dnodeId1, req.dnodeId2,
10,496✔
2882
           req.dnodeId3, tstrerror(code));
2883
  }
2884

2885
  mndReleaseDnode(pMnode, pNew1);
45,811✔
2886
  mndReleaseDnode(pMnode, pNew2);
45,811✔
2887
  mndReleaseDnode(pMnode, pNew3);
45,811✔
2888
  mndReleaseDnode(pMnode, pOld1);
45,811✔
2889
  mndReleaseDnode(pMnode, pOld2);
45,811✔
2890
  mndReleaseDnode(pMnode, pOld3);
45,811✔
2891
  mndReleaseVgroup(pMnode, pVgroup);
45,811✔
2892
  mndReleaseDb(pMnode, pDb);
45,811✔
2893
  tFreeSRedistributeVgroupReq(&req);
45,811✔
2894

2895
  TAOS_RETURN(code);
45,811✔
2896
}
2897

2898
// Build the message body of a force-become-follower request for pVgroup.
//
// The returned buffer starts with an SMsgHead (contLen and vgId stored with htonl) and is
// followed by the serialized SForceBecomeFollowerReq. pMnode and dnodeId are accepted for
// signature compatibility but are not used here.
//
// On success returns the buffer and stores its total size (head + body) in *pContLen; the
// caller releases it with taosMemoryFree(). On failure returns NULL with terrno set to
// TSDB_CODE_OUT_OF_MEMORY.
static void *mndBuildSForceBecomeFollowerReq(SMnode *pMnode, SVgObj *pVgroup, int32_t dnodeId, int32_t *pContLen) {
  SForceBecomeFollowerReq balanceReq = {
      .vgId = pVgroup->vgId,
  };

  // First pass with a NULL buffer only measures the serialized body.
  int32_t bodyLen = tSerializeSForceBecomeFollowerReq(NULL, 0, &balanceReq);
  if (bodyLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }
  int32_t contLen = bodyLen + (int32_t)sizeof(SMsgHead);

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  SMsgHead *pHead = pReq;
  pHead->contLen = htonl(contLen);
  pHead->vgId = htonl(pVgroup->vgId);

  // The body is written after the head, so only bodyLen bytes are available there.
  // Passing the full contLen would overstate the writable space by sizeof(SMsgHead).
  if (tSerializeSForceBecomeFollowerReq((char *)pReq + sizeof(SMsgHead), bodyLen, &balanceReq) < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    taosMemoryFree(pReq);
    return NULL;
  }
  *pContLen = contLen;
  return pReq;
}
2928

2929
// Append a TDMT_SYNC_FORCE_FOLLOWER redo action for pVgroup to pTrans, addressed to the
// endpoint set of dnode dnodeId.
//
// Returns 0 on success. If the dnode cannot be acquired or the request cannot be built, the
// result is terrno when it is non-zero, otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. If the
// append fails, the request buffer is freed here and the append's code is returned.
int32_t mndAddBalanceVgroupLeaderAction(SMnode *pMnode, STrans *pTrans, SVgObj *pVgroup, int32_t dnodeId) {
  int32_t code = 0;

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // Only the endpoint set is needed from the dnode, so the reference is dropped right away.
  STransAction redoAction = {0};
  redoAction.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pBuf = mndBuildSForceBecomeFollowerReq(pMnode, pVgroup, dnodeId, &reqLen);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  redoAction.pCont = pBuf;
  redoAction.contLen = reqLen;
  redoAction.msgType = TDMT_SYNC_FORCE_FOLLOWER;

  code = mndTransAppendRedoAction(pTrans, &redoAction);
  if (code != 0) {
    // The action was not appended, so the buffer is released here.
    taosMemoryFree(pBuf);
  }

  TAOS_RETURN(code);
}
2961

2962
// Serialize an election-baseline change request for pVgroup carrying the value ms.
//
// The buffer holds only the serialized request (no SMsgHead is prepended). pMnode, pDb and
// dnodeId are not used by this function.
// NOTE(review): the request is declared as SAlterVnodeElectBaselineReq but encoded with
// tSerializeSAlterVnodeReplicaReq; presumably both names refer to the same struct - confirm.
//
// On success returns the buffer and stores its length in *pContLen. On failure returns NULL
// with terrno set to TSDB_CODE_OUT_OF_MEMORY.
static void *mndBuildAlterVnodeElectBaselineReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId,
                                          int32_t *pContLen, int32_t ms) {
  SAlterVnodeElectBaselineReq baselineReq = {0};
  baselineReq.vgId = pVgroup->vgId;
  baselineReq.electBaseLine = ms;

  // The length returned for a NULL buffer is what gets allocated below.
  const int32_t reqLen = tSerializeSAlterVnodeReplicaReq(NULL, 0, &baselineReq);
  if (reqLen < 0) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  void *pBuf = taosMemoryMalloc(reqLen);
  if (pBuf == NULL) {
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  const int32_t written = tSerializeSAlterVnodeReplicaReq(pBuf, reqLen, &baselineReq);
  if (written < 0) {
    // Log with the serializer's error text before terrno is overwritten below.
    mError("vgId:%d, failed to serialize alter vnode req,since %s", baselineReq.vgId, terrstr());
    taosMemoryFree(pBuf);
    terrno = TSDB_CODE_OUT_OF_MEMORY;
    return NULL;
  }

  *pContLen = reqLen;
  return pBuf;
}
2990

2991
// Append a TDMT_VND_ALTER_ELECTBASELINE redo action to pTrans that sends the baseline value
// ms for pVgroup to dnode dnodeId. The action's groupId is set to the vgroup id.
//
// Returns 0 on success. If the dnode cannot be acquired or the request cannot be built, the
// result is terrno when it is non-zero, otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. If the
// append fails, the request buffer is freed here and the append's code is returned.
static int32_t mndAddAlterVnodeElectionBaselineActionToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int32_t dnodeId, int32_t ms) {
  int32_t code = 0;

  SDnodeObj *pTarget = mndAcquireDnode(pMnode, dnodeId);
  if (pTarget == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  // Copy the endpoint set, then release the dnode reference immediately.
  STransAction redoAction = {0};
  redoAction.epSet = mndGetDnodeEpset(pTarget);
  mndReleaseDnode(pMnode, pTarget);

  int32_t reqLen = 0;
  void   *pBuf = mndBuildAlterVnodeElectBaselineReq(pMnode, pDb, pVgroup, dnodeId, &reqLen, ms);
  if (pBuf == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  redoAction.pCont = pBuf;
  redoAction.contLen = reqLen;
  redoAction.msgType = TDMT_VND_ALTER_ELECTBASELINE;
  redoAction.groupId = pVgroup->vgId;

  code = mndTransAppendRedoAction(pTrans, &redoAction);
  if (code != 0) {
    // The action was not appended, so the buffer is released here.
    taosMemoryFree(pBuf);
  }

  TAOS_RETURN(code);
}
3024

3025
// Queue one election-baseline action per vnode slot 0..2 of pVgroup.
//
// The slot equal to (index % 3) is sent 1500, every other slot is sent 5000. Because the C
// remainder keeps the sign of the dividend, a negative index such as -1 matches no slot and
// all three slots are sent 5000.
//
// Returns -1 without queuing anything when the vgroup has at most one replica, otherwise the
// first non-zero code from the per-vnode helper, or 0.
// NOTE(review): the loop always visits three slots regardless of pVgroup->replica; verify
// this is intended for vgroups with two replicas.
static int32_t mndAddAlterVgroupElectionBaselineActionToTrans(SMnode *pMnode, SVgObj *pVgroup, STrans *pTrans, int32_t index){
  int32_t code = 0;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t vgid = pVgroup->vgId;
  int8_t  replica = pVgroup->replica;

  if (pVgroup->replica <= 1) {
    mInfo("trans:%d, vgid:%d no need to balance, replica:%d", pTrans->id, vgid, replica);
    return -1;
  }

  const int32_t favoredSlot = index % 3;
  for (int32_t slot = 0; slot < 3; ++slot) {
    const int32_t targetDnode = pVgroup->vnodeGid[slot].dnodeId;
    int32_t       baselineMs = 5000;

    if (slot == favoredSlot) {
      mInfo("trans:%d, balance leader to dnode:%d", pTrans->id, targetDnode);
      baselineMs = 1500;
    }

    TAOS_CHECK_RETURN(
        mndAddAlterVnodeElectionBaselineActionToTrans(pMnode, pTrans, NULL, pVgroup, targetDnode, baselineMs));
  }

  return code;
}
3050

3051
// Queue the actions that move leadership of pVgroup away from its current leader.
//
// The current leader is the first replica whose syncState is TAOS_SYNC_STATE_LEADER. When
// its dnode exists and is online, the following are appended to pTrans in order:
//   1. election-baseline actions favoring slot (index % 3),
//   2. a force-follower action sent to the current leader's dnode,
//   3. an alter-vnode confirm action,
//   4. election-baseline actions with index -1 (no favored slot),
// and finally the vgroup's database is acquired and released to check that it still exists.
// Otherwise only an informational message is logged.
//
// Returns -1 when the vgroup has at most one replica, the first failing step's code on
// error, and 0 otherwise (including the "cannot be balanced" case).
int32_t mndAddVgroupBalanceToTrans(SMnode *pMnode, SVgObj *pVgroup, STrans *pTrans, int32_t index) {
  int32_t code = 0;
  SSdb   *pSdb = pMnode->pSdb;
  int32_t vgid = pVgroup->vgId;
  int8_t  replica = pVgroup->replica;

  if (pVgroup->replica <= 1) {
    mInfo("trans:%d, vgid:%d no need to balance, replica:%d", pTrans->id, vgid, replica);
    return -1;
  }

  // Locate the first replica reporting itself as leader; dnodeId stays 0 when there is none.
  int32_t dnodeId = 0;
  int     slot = 0;
  while (slot < replica && pVgroup->vnodeGid[slot].syncState != TAOS_SYNC_STATE_LEADER) {
    slot++;
  }
  if (slot < replica) {
    dnodeId = pVgroup->vnodeGid[slot].dnodeId;
  }

  bool       exist = false;
  bool       online = false;
  int64_t    curMs = taosGetTimestampMs();
  SDnodeObj *pLeaderDnode = mndAcquireDnode(pMnode, dnodeId);
  if (pLeaderDnode != NULL) {
    exist = true;
    online = mndIsDnodeOnline(pLeaderDnode, curMs);
    mndReleaseDnode(pMnode, pLeaderDnode);
  }

  if (!(exist && online)) {
    mInfo("trans:%d, vgid:%d cant be balanced to dnode:%d, exist:%d, online:%d", pTrans->id, vgid, dnodeId, exist,
          online);
    TAOS_RETURN(code);
  }

  mInfo("trans:%d, vgid:%d force drop leader from dnode:%d", pTrans->id, vgid, dnodeId);
  TAOS_CHECK_RETURN(mndAddAlterVgroupElectionBaselineActionToTrans(pMnode, pVgroup, pTrans, index));

  code = mndAddBalanceVgroupLeaderAction(pMnode, pTrans, pVgroup, dnodeId);
  if (code != 0) {
    mError("trans:%d, vgid:%d failed to be balanced to dnode:%d", pTrans->id, vgid, dnodeId);
    TAOS_RETURN(code);
  }

  TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, NULL, pVgroup));

  // Index -1 favors no slot, so every replica receives the same baseline again.
  TAOS_CHECK_RETURN(mndAddAlterVgroupElectionBaselineActionToTrans(pMnode, pVgroup, pTrans, -1));

  // The database object is not used further; acquiring it only verifies that it exists.
  SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
  if (pDb == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    mError("trans:%d, vgid:%d failed to be balanced to dnode:%d, because db not exist", pTrans->id, vgid, dnodeId);
    TAOS_RETURN(code);
  }
  mndReleaseDb(pMnode, pDb);

  TAOS_RETURN(code);
}
3111

3112
// Implementation hook for the balance-vgroup-leader request. When TD_ENTERPRISE is not
// defined, the stub at the end of this group is compiled instead.
// NOTE(review): presumably the enterprise build provides the real implementation in
// another translation unit - confirm.
extern int32_t mndProcessVgroupBalanceLeaderMsgImp(SRpcMsg *pReq);

// Entry point for the balance-vgroup-leader request: forwards pReq to the implementation
// hook and returns its result unchanged.
int32_t mndProcessVgroupBalanceLeaderMsg(SRpcMsg *pReq) {
  return mndProcessVgroupBalanceLeaderMsgImp(pReq);
}

#ifndef TD_ENTERPRISE
// Stub used when TD_ENTERPRISE is not defined: does nothing and reports success.
int32_t mndProcessVgroupBalanceLeaderMsgImp(SRpcMsg *pReq) {
  return 0;
}
#endif
3119

3120
// Re-account the memory of every dnode in pArray for a vgroup change and check that each
// dnode still has memory left.
//
// For each dnode, the memory of pOldVgroup (as computed with pOldDb) is subtracted when the
// dnode appears among the old replicas, and the memory of pNewVgroup (as computed with
// pNewDb) is added when it appears among the new replicas. The dnode's memUsed field in the
// array is updated in place.
//
// Returns TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE as soon as a dnode's memAvail minus its
// updated memUsed is not positive (entries visited before it keep their updated memUsed),
// otherwise 0.
static int32_t mndCheckDnodeMemory(SMnode *pMnode, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pOldVgroup,
                                   SVgObj *pNewVgroup, SArray *pArray) {
  const int32_t numDnodes = (int32_t)taosArrayGetSize(pArray);

  for (int32_t idx = 0; idx < numDnodes; ++idx) {
    SDnodeObj *pDnode = taosArrayGet(pArray, idx);
    bool       hostsVnode = false;
    int64_t    memBefore = 0;
    int64_t    memAfter = 0;

    mDebug("db:%s, vgId:%d, check dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName, pNewVgroup->vgId,
           pDnode->id, pDnode->memAvail, pDnode->memUsed);

    // Memory this dnode currently spends on the vgroup, if it hosts an old replica.
    for (int32_t r = 0; r < pOldVgroup->replica; ++r) {
      if (pOldVgroup->vnodeGid[r].dnodeId != pDnode->id) continue;
      memBefore = mndGetVgroupMemory(pMnode, pOldDb, pOldVgroup);
      hostsVnode = true;
    }

    // Memory this dnode will spend on the vgroup, if it hosts a new replica.
    for (int32_t r = 0; r < pNewVgroup->replica; ++r) {
      if (pNewVgroup->vnodeGid[r].dnodeId != pDnode->id) continue;
      memAfter = mndGetVgroupMemory(pMnode, pNewDb, pNewVgroup);
      hostsVnode = true;
    }

    mDebug("db:%s, vgId:%d, memory in dnode:%d, oldUsed:%" PRId64 ", newUsed:%" PRId64, pNewVgroup->dbName,
           pNewVgroup->vgId, pDnode->id, memBefore, memAfter);

    pDnode->memUsed = pDnode->memUsed - memBefore + memAfter;

    if (pDnode->memAvail - pDnode->memUsed <= 0) {
      mError("db:%s, vgId:%d, no enough memory in dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName,
             pNewVgroup->vgId, pDnode->id, pDnode->memAvail, pDnode->memUsed);
      TAOS_RETURN(TSDB_CODE_MND_NO_ENOUGH_MEM_IN_DNODE);
    }

    if (hostsVnode) {
      mInfo("db:%s, vgId:%d, memory in dnode:%d, avail:%" PRId64 " used:%" PRId64, pNewVgroup->dbName, pNewVgroup->vgId,
            pDnode->id, pDnode->memAvail, pDnode->memUsed);
    }
  }

  return 0;
}
3160

3161
int32_t mndBuildAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pVgroup,
250,166✔
3162
                                  SArray *pArray, SVgObj *pNewVgroup) {
3163
  int32_t code = 0;
250,166✔
3164
  memcpy(pNewVgroup, pVgroup, sizeof(SVgObj));
250,166✔
3165

3166
  if (pVgroup->replica <= 0 || pVgroup->replica == pNewDb->cfg.replications) {
250,166✔
3167
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfigAction(pMnode, pTrans, pNewDb, pVgroup));
208,644✔
3168
    TAOS_CHECK_RETURN(mndCheckDnodeMemory(pMnode, pOldDb, pNewDb, pNewVgroup, pVgroup, pArray));
208,644✔
3169
    return 0;
208,644✔
3170
  }
3171

3172
  // mndTransSetGroupParallel(pTrans);
3173

3174
  if (pNewDb->cfg.replications == 3) {
41,522✔
3175
    mInfo("trans:%d, db:%s, vgId:%d, will add 2 vnodes, vn:0 dnode:%d", pTrans->id, pVgroup->dbName, pVgroup->vgId,
35,111✔
3176
          pVgroup->vnodeGid[0].dnodeId);
3177

3178
    // add second
3179
    if (pNewVgroup->replica == 1) {
35,111✔
3180
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
35,111✔
3181
    }
3182

3183
    // learner stage
3184
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
34,375✔
3185
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
34,375✔
3186
    TAOS_CHECK_RETURN(
34,375✔
3187
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3188

3189
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[1]));
34,375✔
3190

3191
    // follower stage
3192
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
34,375✔
3193
    TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
34,375✔
3194
    TAOS_CHECK_RETURN(
34,375✔
3195
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3196

3197
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
34,375✔
3198

3199
    // add third
3200
    if (pNewVgroup->replica == 2) {
34,375✔
3201
      TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
34,375✔
3202
    }
3203

3204
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
34,288✔
3205
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
34,288✔
3206
    pNewVgroup->vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
34,288✔
3207
    TAOS_CHECK_RETURN(
34,288✔
3208
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3209
    TAOS_CHECK_RETURN(
34,288✔
3210
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
3211
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[2]));
34,288✔
3212

3213
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
34,288✔
3214
  } else if (pNewDb->cfg.replications == 1) {
6,411✔
3215
    mInfo("trans:%d, db:%s, vgId:%d, will remove 2 vnodes, vn:0 dnode:%d vn:1 dnode:%d vn:2 dnode:%d", pTrans->id,
4,941✔
3216
          pVgroup->dbName, pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId, pVgroup->vnodeGid[1].dnodeId,
3217
          pVgroup->vnodeGid[2].dnodeId);
3218

3219
    SVnodeGid del1 = {0};
4,941✔
3220
    SVnodeGid del2 = {0};
4,941✔
3221
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroup(pMnode, pTrans, pNewVgroup, pArray, &del1));
4,941✔
3222
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &del1, true));
4,941✔
3223
    TAOS_CHECK_RETURN(
4,941✔
3224
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3225
    TAOS_CHECK_RETURN(
4,941✔
3226
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
3227
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
4,941✔
3228

3229
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroup(pMnode, pTrans, pNewVgroup, pArray, &del2));
4,941✔
3230
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &del2, true));
4,941✔
3231
    TAOS_CHECK_RETURN(
4,941✔
3232
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3233
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
4,941✔
3234
  } else if (pNewDb->cfg.replications == 2) {
1,470✔
3235
    mInfo("trans:%d, db:%s, vgId:%d, will add 1 vnode, vn:0 dnode:%d", pTrans->id, pVgroup->dbName, pVgroup->vgId,
1,470✔
3236
          pVgroup->vnodeGid[0].dnodeId);
3237

3238
    // add second
3239
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, pNewVgroup, pArray));
1,470✔
3240

3241
    // learner stage
3242
    pNewVgroup->vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
1,470✔
3243
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
1,470✔
3244
    TAOS_CHECK_RETURN(
1,470✔
3245
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3246

3247
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, pNewVgroup, &pNewVgroup->vnodeGid[1]));
1,470✔
3248

3249
    // follower stage
3250
    pNewVgroup->vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
1,470✔
3251
    TAOS_CHECK_RETURN(mndAddAlterVnodeTypeAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[1].dnodeId));
1,470✔
3252
    TAOS_CHECK_RETURN(
1,470✔
3253
        mndAddAlterVnodeReplicaAction(pMnode, pTrans, pNewDb, pNewVgroup, pNewVgroup->vnodeGid[0].dnodeId));
3254

3255
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, pNewVgroup));
1,470✔
3256
  } else {
3257
    return -1;
×
3258
  }
3259

3260
  mndSortVnodeGid(pNewVgroup);
40,699✔
3261

3262
  {
3263
    SSdbRaw *pVgRaw = mndVgroupActionEncode(pNewVgroup);
40,699✔
3264
    if (pVgRaw == NULL) {
40,699✔
3265
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3266
      if (terrno != 0) code = terrno;
×
3267
      TAOS_RETURN(code);
×
3268
    }
3269
    if ((code = mndTransAppendCommitlog(pTrans, pVgRaw)) != 0) {
40,699✔
3270
      sdbFreeRaw(pVgRaw);
×
3271
      TAOS_RETURN(code);
×
3272
    }
3273
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
40,699✔
3274
    if (code != 0) {
40,699✔
3275
      mError("vgId:%d, failed to set raw status since %s at line:%d", pNewVgroup->vgId, tstrerror(code), __LINE__);
×
3276
      TAOS_RETURN(code);
×
3277
    }
3278
  }
3279

3280
  TAOS_RETURN(code);
40,699✔
3281
}
3282

3283
int32_t mndBuildRaftAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pOldDb, SDbObj *pNewDb, SVgObj *pVgroup,
×
3284
                                      SArray *pArray) {
3285
  int32_t code = 0;
×
3286
  SVgObj  newVgroup = {0};
×
3287
  memcpy(&newVgroup, pVgroup, sizeof(SVgObj));
×
3288

3289
  if (pVgroup->replica <= 0 || pVgroup->replica == pNewDb->cfg.replications) {
×
3290
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfigAction(pMnode, pTrans, pNewDb, pVgroup));
×
3291
    TAOS_CHECK_RETURN(mndCheckDnodeMemory(pMnode, pOldDb, pNewDb, &newVgroup, pVgroup, pArray));
×
3292
    return 0;
×
3293
  }
3294

3295
  mndTransSetSerial(pTrans);
×
3296

3297
  mInfo("trans:%d, vgId:%d, alter vgroup, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3298
        pVgroup->syncConfChangeVer, pVgroup->version, pVgroup->replica);
3299

3300
  if (newVgroup.replica == 1 && pNewDb->cfg.replications == 3) {
×
3301
    mInfo("db:%s, vgId:%d, will add 2 vnodes, vn:0 dnode:%d", pVgroup->dbName, pVgroup->vgId,
×
3302
          pVgroup->vnodeGid[0].dnodeId);
3303

3304
    // add second
3305
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVgroup, pArray));
×
3306
    // add third
3307
    TAOS_CHECK_RETURN(mndAddVnodeToVgroup(pMnode, pTrans, &newVgroup, pArray));
×
3308

3309
    // add learner stage
3310
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3311
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3312
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3313
    TAOS_CHECK_RETURN(
×
3314
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3315
    mInfo("trans:%d, vgId:%d, add change config, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id,
×
3316
          pVgroup->vgId, newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3317
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &newVgroup.vnodeGid[1]));
×
3318
    mInfo("trans:%d, vgId:%d, create vnode, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3319
          newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3320
    TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &newVgroup.vnodeGid[2]));
×
3321
    mInfo("trans:%d, vgId:%d, create vnode, syncConfChangeVer:%d, version:%d, replica:%d", pTrans->id, pVgroup->vgId,
×
3322
          newVgroup.syncConfChangeVer, pVgroup->version, pVgroup->replica);
3323

3324
    // check learner
3325
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3326
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3327
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3328
    TAOS_CHECK_RETURN(
×
3329
        mndAddCheckLearnerCatchupAction(pMnode, pTrans, pNewDb, &newVgroup, newVgroup.vnodeGid[1].dnodeId));
3330
    TAOS_CHECK_RETURN(
×
3331
        mndAddCheckLearnerCatchupAction(pMnode, pTrans, pNewDb, &newVgroup, newVgroup.vnodeGid[2].dnodeId));
3332

3333
    // change raft type
3334
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3335
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3336
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_LEARNER;
×
3337
    TAOS_CHECK_RETURN(
×
3338
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3339

3340
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3341

3342
    newVgroup.vnodeGid[0].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3343
    newVgroup.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3344
    newVgroup.vnodeGid[2].nodeRole = TAOS_SYNC_ROLE_VOTER;
×
3345
    TAOS_CHECK_RETURN(
×
3346
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3347

3348
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3349

3350
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3351
    if (pVgRaw == NULL) {
×
3352
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3353
      if (terrno != 0) code = terrno;
×
3354
      TAOS_RETURN(code);
×
3355
    }
3356
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3357
      sdbFreeRaw(pVgRaw);
×
3358
      TAOS_RETURN(code);
×
3359
    }
3360
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3361
    if (code != 0) {
×
3362
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3363
             __LINE__);
3364
      TAOS_RETURN(code);
×
3365
    }
3366
  } else if (newVgroup.replica == 3 && pNewDb->cfg.replications == 1) {
×
3367
    mInfo("db:%s, vgId:%d, will remove 2 vnodes, vn:0 dnode:%d vn:1 dnode:%d vn:2 dnode:%d", pVgroup->dbName,
×
3368
          pVgroup->vgId, pVgroup->vnodeGid[0].dnodeId, pVgroup->vnodeGid[1].dnodeId, pVgroup->vnodeGid[2].dnodeId);
3369

3370
    SVnodeGid del1 = {0};
×
3371
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroupWithoutSave(pMnode, pTrans, &newVgroup, pArray, &del1));
×
3372

3373
    TAOS_CHECK_RETURN(
×
3374
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3375

3376
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3377

3378
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &del1, true));
×
3379

3380
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3381
    if (pVgRaw == NULL) {
×
3382
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3383
      if (terrno != 0) code = terrno;
×
3384
      TAOS_RETURN(code);
×
3385
    }
3386
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3387
      sdbFreeRaw(pVgRaw);
×
3388
      TAOS_RETURN(code);
×
3389
    }
3390
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3391
    if (code != 0) {
×
3392
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3393
             __LINE__);
3394
      TAOS_RETURN(code);
×
3395
    }
3396

3397
    SVnodeGid del2 = {0};
×
3398
    TAOS_CHECK_RETURN(mndRemoveVnodeFromVgroupWithoutSave(pMnode, pTrans, &newVgroup, pArray, &del2));
×
3399

3400
    TAOS_CHECK_RETURN(
×
3401
        mndAddChangeConfigAction(pMnode, pTrans, pNewDb, pVgroup, &newVgroup, newVgroup.vnodeGid[0].dnodeId));
3402

3403
    TAOS_CHECK_RETURN(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pNewDb, &newVgroup));
×
3404

3405
    TAOS_CHECK_RETURN(mndAddDropVnodeAction(pMnode, pTrans, pNewDb, &newVgroup, &del2, true));
×
3406

3407
    pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3408
    if (pVgRaw == NULL) {
×
3409
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3410
      if (terrno != 0) code = terrno;
×
3411
      TAOS_RETURN(code);
×
3412
    }
3413
    if ((code = mndTransAppendRedolog(pTrans, pVgRaw)) != 0) {
×
3414
      sdbFreeRaw(pVgRaw);
×
3415
      TAOS_RETURN(code);
×
3416
    }
3417
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3418
    if (code != 0) {
×
3419
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3420
             __LINE__);
3421
      TAOS_RETURN(code);
×
3422
    }
3423
  } else {
3424
    return -1;
×
3425
  }
3426

3427
  mndSortVnodeGid(&newVgroup);
×
3428

3429
  {
3430
    SSdbRaw *pVgRaw = mndVgroupActionEncode(&newVgroup);
×
3431
    if (pVgRaw == NULL) {
×
3432
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3433
      if (terrno != 0) code = terrno;
×
3434
      TAOS_RETURN(code);
×
3435
    }
3436
    if ((code = mndTransAppendCommitlog(pTrans, pVgRaw)) != 0) {
×
3437
      sdbFreeRaw(pVgRaw);
×
3438
      TAOS_RETURN(code);
×
3439
    }
3440
    code = sdbSetRawStatus(pVgRaw, SDB_STATUS_READY);
×
3441
    if (code != 0) {
×
3442
      mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code),
×
3443
             __LINE__);
3444
      TAOS_RETURN(code);
×
3445
    }
3446
  }
3447

3448
  TAOS_RETURN(code);
×
3449
}
3450

3451
// Build the transaction actions that restore the vnode of pVgroup located on pDnode.
//
// Work is done on a local copy of pVgroup. Depending on the copy's replica count:
//   - 1: every replica is marked voter and a create-vnode action is added for the slot on
//        pDnode (slot 0 if none matches).
//   - 2: the slot on pDnode is marked learner, an alter-type action is added for
//        pAnotherDnode and a create action for pDnode; then all slots are marked voter and
//        alter-type actions are added for pDnode and pAnotherDnode.
//   - 3: the slot on pDnode is marked learner and a create action is added for pDnode; then
//        all slots are marked voter and an alter-type action is added for pDnode.
//   - any other value: no vnode actions are added.
// In every case the copy's record is appended to the commit log with SDB_STATUS_READY.
//
// Returns 0 on success or the first failing step's code.
int32_t mndBuildRestoreAlterVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *db, SVgObj *pVgroup, SDnodeObj *pDnode,
                                         SDnodeObj *pAnotherDnode) {
  int32_t code = 0;
  SVgObj  newVgroup = {0};
  memcpy(&newVgroup, pVgroup, sizeof(SVgObj));

  mInfo("trans:%d, db:%s, vgId:%d, restore vnodes, vn:0 dnode:%d", pTrans->id, pVgroup->dbName, pVgroup->vgId,
        pVgroup->vnodeGid[0].dnodeId);

  switch (newVgroup.replica) {
    case 1: {
      int target = 0;
      for (int i = 0; i < newVgroup.replica; i++) {
        newVgroup.vnodeGid[i].nodeRole = TAOS_SYNC_ROLE_VOTER;
        if (newVgroup.vnodeGid[i].dnodeId == pDnode->id) target = i;
      }
      TAOS_CHECK_RETURN(mndAddCreateVnodeAction(pMnode, pTrans, db, &newVgroup, &newVgroup.vnodeGid[target]));
      break;
    }

    case 2: {
      for (int i = 0; i < newVgroup.replica; i++) {
        newVgroup.vnodeGid[i].nodeRole =
            (newVgroup.vnodeGid[i].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &newVgroup, pAnotherDnode));

      // Roles are assigned again before the create action, exactly as before the alter action.
      for (int i = 0; i < newVgroup.replica; i++) {
        newVgroup.vnodeGid[i].nodeRole =
            (newVgroup.vnodeGid[i].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddCreateVnodeAction(pMnode, pTrans, db, &newVgroup, pDnode));

      for (int i = 0; i < newVgroup.replica; i++) {
        newVgroup.vnodeGid[i].nodeRole = TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &newVgroup, pDnode));
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &newVgroup, pAnotherDnode));
      break;
    }

    case 3: {
      for (int i = 0; i < newVgroup.replica; i++) {
        newVgroup.vnodeGid[i].nodeRole =
            (newVgroup.vnodeGid[i].dnodeId == pDnode->id) ? TAOS_SYNC_ROLE_LEARNER : TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddCreateVnodeAction(pMnode, pTrans, db, &newVgroup, pDnode));

      for (int i = 0; i < newVgroup.replica; i++) {
        newVgroup.vnodeGid[i].nodeRole = TAOS_SYNC_ROLE_VOTER;
      }
      TAOS_CHECK_RETURN(mndRestoreAddAlterVnodeTypeAction(pMnode, pTrans, db, &newVgroup, pDnode));
      break;
    }

    default:
      break;
  }

  SSdbRaw *pRaw = mndVgroupActionEncode(&newVgroup);
  if (pRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendCommitlog(pTrans, pRaw);
  if (code != 0) {
    // Not appended, so the record is released here.
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  code = sdbSetRawStatus(pRaw, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", newVgroup.vgId, tstrerror(code), __LINE__);
  }

  TAOS_RETURN(code);
}
3530

3531
// Placeholder: adds no action to the transaction, ignores all of its arguments and always
// returns 0.
static int32_t mndAddAdjustVnodeHashRangeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = 0;
  return code;
}
3534

3535
// Pointer to a function that takes a transaction and an encoded sdb raw record and returns
// an int32_t status code.
typedef int32_t (*FpTransActionCb)(STrans *pTrans, SSdbRaw *pRaw);
3536

3537
// Encode pVg as an sdb raw record, append it to pTrans and set the record's status to
// vgStatus.
//
// The record is appended to the commit log when stage is TRN_STAGE_COMMIT_ACTION and to the
// redo log for every other stage.
//
// Returns 0 on success. If encoding fails, the result is terrno when it is non-zero,
// otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. If the append or the status update fails, that
// step's code is returned.
static int32_t mndAddVgStatusAction(STrans *pTrans, SVgObj *pVg, ESdbStatus vgStatus, ETrnStage stage) {
  int32_t         code = 0;
  FpTransActionCb appendActionCb = (stage == TRN_STAGE_COMMIT_ACTION) ? mndTransAppendCommitlog : mndTransAppendRedolog;
  SSdbRaw        *pRaw = mndVgroupActionEncode(pVg);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  if ((code = appendActionCb(pTrans, pRaw)) != 0) {
    // The record never reached the transaction, so it is released here.
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // Once appended, the record is referenced by the transaction. It must not be freed here
  // even if the status update fails, otherwise the transaction keeps a dangling pointer.
  // The other vgroup builders in this file likewise free the record only on append failure.
  code = sdbSetRawStatus(pRaw, vgStatus);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", pVg->vgId, tstrerror(code), __LINE__);
  }

  TAOS_RETURN(code);
}
3558

3559
// Encode pDb as an sdb raw record, append it to pTrans and set the record's status to
// dbStatus.
//
// The record is appended to the commit log when stage is TRN_STAGE_COMMIT_ACTION and to the
// redo log for every other stage.
//
// Returns 0 on success. If encoding fails, the result is terrno when it is non-zero,
// otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. If the append or the status update fails, that
// step's code is returned.
static int32_t mndAddDbStatusAction(STrans *pTrans, SDbObj *pDb, ESdbStatus dbStatus, ETrnStage stage) {
  int32_t         code = 0;
  FpTransActionCb appendActionCb = (stage == TRN_STAGE_COMMIT_ACTION) ? mndTransAppendCommitlog : mndTransAppendRedolog;
  SSdbRaw        *pRaw = mndDbActionEncode(pDb);
  if (pRaw == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    TAOS_RETURN(code);
  }

  if ((code = appendActionCb(pTrans, pRaw)) != 0) {
    // The record never reached the transaction, so it is released here.
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  // Once appended, the record is referenced by the transaction. It must not be freed here
  // even if the status update fails, otherwise the transaction keeps a dangling pointer.
  // The vgroup builders in this file likewise free the record only on append failure.
  code = sdbSetRawStatus(pRaw, dbStatus);
  if (code != 0) {
    mError("db:%s, failed to set raw status to ready, error:%s, line:%d", pDb->name, tstrerror(code), __LINE__);
  }

  TAOS_RETURN(code);
}
3580

3581
// Build and prepare a "split-vgroup" transaction that replaces pVgroup with
// two single-replica vgroups, each covering half of the original hash range.
//
// Outline of the actions queued on the transaction:
//   1. bring the source vgroup to two vnodes (add one when replica == 1,
//      drop one when replica == 3),
//   2. disable writes on the remaining vnodes,
//   3. give each vnode a new vgId (starting at sdbGetMaxId) and its half of
//      the hash range,
//   4. record the two new vgroups as READY and the source vgroup as DROPPED,
//      and bump the db's vgVersion / numOfVgroups,
//   5. re-expand each new vgroup when the db's replica count is not 1.
//
// pMnode  - mnode instance
// pReq    - originating rpc request, passed to mndTransCreate
// pDb     - database that owns pVgroup
// pVgroup - vgroup to split; it is only read here, all changes are made on copies
//
// Returns 0 once the transaction has been prepared, otherwise an error code.
int32_t mndSplitVgroup(SMnode *pMnode, SRpcMsg *pReq, SDbObj *pDb, SVgObj *pVgroup) {
  int32_t code = -1;
  STrans *pTrans = NULL;
  SDbObj  dbObj = {0};
  SArray *pArray = mndBuildDnodesArray(pMnode, 0, NULL);

#if defined(USE_SHARED_STORAGE)
  if (tsSsEnabled) {
    code = TSDB_CODE_OPS_NOT_SUPPORT;
    mError("vgId:%d, db:%s, shared storage exists, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
    goto _OVER;
  }
#endif

  // The dnode array is handed to the add/remove-vnode helpers below; fail
  // early instead of passing them a NULL array.
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  /*
    if (pDb->cfg.withArbitrator) {
      code = TSDB_CODE_OPS_NOT_SUPPORT;
      mError("vgId:%d, db:%s, with arbitrator, split vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
      goto _OVER;
    }
  */

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_DB, pReq, "split-vgroup");
  if (pTrans == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to split vgroup, vgId:%d", pTrans->id, pVgroup->vgId);

  mndTransSetDbName(pTrans, pDb->name, NULL);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithRetention(pMnode, pTrans), NULL, _OVER);

  // Work on a copy so the sdb object stays untouched.
  SVgObj newVg1 = {0};
  memcpy(&newVg1, pVgroup, sizeof(SVgObj));
  mInfo("vgId:%d, vgroup info before split, replica:%d hashBegin:%u hashEnd:%u", newVg1.vgId, newVg1.replica,
        newVg1.hashBegin, newVg1.hashEnd);
  for (int32_t i = 0; i < newVg1.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg1.vgId, i, newVg1.vnodeGid[i].dnodeId);
  }

  if (newVg1.replica == 1) {
    // One vnode: add a second one as learner, then promote it to voter.
    TAOS_CHECK_GOTO(mndAddVnodeToVgroup(pMnode, pTrans, &newVg1, pArray), NULL, _OVER);

    newVg1.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_LEARNER;
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);
    TAOS_CHECK_GOTO(mndAddCreateVnodeAction(pMnode, pTrans, pDb, &newVg1, &newVg1.vnodeGid[1]), NULL, _OVER);

    newVg1.vnodeGid[1].nodeRole = TAOS_SYNC_ROLE_VOTER;
    TAOS_CHECK_GOTO(mndAddAlterVnodeTypeAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[1].dnodeId), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);

    TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);
  } else if (newVg1.replica == 3) {
    // Three vnodes: drop one and reconfigure the two that remain.
    SVnodeGid del1 = {0};
    TAOS_CHECK_GOTO(mndRemoveVnodeFromVgroup(pMnode, pTrans, &newVg1, pArray, &del1), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddDropVnodeAction(pMnode, pTrans, pDb, &newVg1, &del1, true), NULL, _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[0].dnodeId), NULL,
                    _OVER);
    TAOS_CHECK_GOTO(mndAddAlterVnodeReplicaAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[1].dnodeId), NULL,
                    _OVER);
  } else {
    // Any other replica count proceeds without a replica adjustment.
    // goto _OVER;
  }

  for (int32_t i = 0; i < newVg1.replica; ++i) {
    TAOS_CHECK_GOTO(mndAddDisableVnodeWriteAction(pMnode, pTrans, pDb, &newVg1, newVg1.vnodeGid[i].dnodeId), NULL,
                    _OVER);
  }
  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);

  // newVg1 keeps vnode 0 and the lower half of the hash range; newVg2 takes
  // vnode 1 (moved into slot 0) and the upper half.
  SVgObj newVg2 = {0};
  memcpy(&newVg2, &newVg1, sizeof(SVgObj));
  newVg1.replica = 1;
  // Halve each bound separately so the sum cannot overflow.
  newVg1.hashEnd = newVg1.hashBegin / 2 + newVg1.hashEnd / 2;
  memset(&newVg1.vnodeGid[1], 0, sizeof(SVnodeGid));

  newVg2.replica = 1;
  newVg2.hashBegin = newVg1.hashEnd + 1;
  memcpy(&newVg2.vnodeGid[0], &newVg2.vnodeGid[1], sizeof(SVnodeGid));
  memset(&newVg2.vnodeGid[1], 0, sizeof(SVnodeGid));

  mInfo("vgId:%d, vgroup info after split, replica:%d hashrange:[%u, %u] vnode:0 dnode:%d", newVg1.vgId, newVg1.replica,
        newVg1.hashBegin, newVg1.hashEnd, newVg1.vnodeGid[0].dnodeId);
  for (int32_t i = 0; i < newVg1.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg1.vgId, i, newVg1.vnodeGid[i].dnodeId);
  }
  mInfo("vgId:%d, vgroup info after split, replica:%d hashrange:[%u, %u] vnode:0 dnode:%d", newVg2.vgId, newVg2.replica,
        newVg2.hashBegin, newVg2.hashEnd, newVg2.vnodeGid[0].dnodeId);
  for (int32_t i = 0; i < newVg2.replica; ++i) {
    mInfo("vgId:%d, vnode:%d dnode:%d", newVg2.vgId, i, newVg2.vnodeGid[i].dnodeId);
  }

  // alter vgId and hash range
  int32_t maxVgId = sdbGetMaxId(pMnode->pSdb, SDB_VGROUP);
  int32_t srcVgId = newVg1.vgId;
  newVg1.vgId = maxVgId;
  TAOS_CHECK_GOTO(mndAddNewVgPrepareAction(pMnode, pTrans, &newVg1), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeHashRangeAction(pMnode, pTrans, srcVgId, &newVg1), NULL, _OVER);

  maxVgId++;
  srcVgId = newVg2.vgId;
  newVg2.vgId = maxVgId;
  TAOS_CHECK_GOTO(mndAddNewVgPrepareAction(pMnode, pTrans, &newVg2), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeHashRangeAction(pMnode, pTrans, srcVgId, &newVg2), NULL, _OVER);

  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg1), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddAlterVnodeConfirmAction(pMnode, pTrans, pDb, &newVg2), NULL, _OVER);

  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg1, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg2, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);
  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, pVgroup, SDB_STATUS_DROPPED, TRN_STAGE_REDO_ACTION), NULL, _OVER);

  // update db status
  // dbObj is a shallow copy of pDb; pRetensions is duplicated so the copy
  // destroyed at _OVER is private to this function.
  memcpy(&dbObj, pDb, sizeof(SDbObj));
  if (dbObj.cfg.pRetensions != NULL) {
    dbObj.cfg.pRetensions = taosArrayDup(pDb->cfg.pRetensions, NULL);
    if (dbObj.cfg.pRetensions == NULL) {
      code = terrno;
      goto _OVER;
    }
  }
  dbObj.vgVersion++;
  dbObj.updateTime = taosGetTimestampMs();
  dbObj.cfg.numOfVgroups++;
  TAOS_CHECK_GOTO(mndAddDbStatusAction(pTrans, &dbObj, SDB_STATUS_READY, TRN_STAGE_REDO_ACTION), NULL, _OVER);

  // adjust vgroup replica
  if (pDb->cfg.replications != newVg1.replica) {
    SVgObj tmpGroup = {0};
    TAOS_CHECK_GOTO(mndBuildAlterVgroupAction(pMnode, pTrans, pDb, pDb, &newVg1, pArray, &tmpGroup), NULL, _OVER);
  } else {
    TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg1, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);
  }

  if (pDb->cfg.replications != newVg2.replica) {
    SVgObj tmpGroup = {0};
    TAOS_CHECK_GOTO(mndBuildAlterVgroupAction(pMnode, pTrans, pDb, pDb, &newVg2, pArray, &tmpGroup), NULL, _OVER);
  } else {
    TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, &newVg2, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);
  }

  TAOS_CHECK_GOTO(mndAddVgStatusAction(pTrans, pVgroup, SDB_STATUS_DROPPED, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);

  // commit db status
  dbObj.vgVersion++;
  dbObj.updateTime = taosGetTimestampMs();
  TAOS_CHECK_GOTO(mndAddDbStatusAction(pTrans, &dbObj, SDB_STATUS_READY, TRN_STAGE_COMMIT_ACTION), NULL, _OVER);

  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);
  code = 0;

_OVER:
  taosArrayDestroy(pArray);
  mndTransDrop(pTrans);
  taosArrayDestroy(dbObj.cfg.pRetensions);
  TAOS_RETURN(code);
}
3743

3744
// Declared here; this file only provides a definition when TD_ENTERPRISE is
// not defined (see the fallback below).
extern int32_t mndProcessSplitVgroupMsgImp(SRpcMsg *pReq);

// Thin wrapper that forwards pReq to mndProcessSplitVgroupMsgImp and returns
// its result unchanged.
static int32_t mndProcessSplitVgroupMsg(SRpcMsg *pReq) {
  return mndProcessSplitVgroupMsgImp(pReq);
}

#ifndef TD_ENTERPRISE
// Fallback used when TD_ENTERPRISE is not defined: ignores the request and
// reports success.
int32_t mndProcessSplitVgroupMsgImp(SRpcMsg *pReq) {
  return 0;
}
#endif
3751

3752
// Queue on pTrans the actions that move one vnode of pVgroup from pSrc to
// pDst: a replica is first added on pDst, then removed from pSrc, and the
// resulting vgroup is appended to the commit log with status READY.
//
// pVgroup itself is not modified; all changes are applied to a local copy.
// Returns 0 on success, otherwise the error of the first failing step.
static int32_t mndSetBalanceVgroupInfoToTrans(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup,
                                              SDnodeObj *pSrc, SDnodeObj *pDst) {
  int32_t code = 0;
  SVgObj  movedVg = {0};
  memcpy(&movedVg, pVgroup, sizeof(movedVg));

  mInfo("vgId:%d, vgroup info before balance, replica:%d", movedVg.vgId, movedVg.replica);
  for (int32_t idx = 0; idx < movedVg.replica; ++idx) {
    mInfo("vgId:%d, vnode:%d dnode:%d", movedVg.vgId, idx, movedVg.vnodeGid[idx].dnodeId);
  }

  // Grow onto the destination first, then shrink away from the source.
  TAOS_CHECK_RETURN(mndAddIncVgroupReplicaToTrans(pMnode, pTrans, pDb, &movedVg, pDst->id));
  TAOS_CHECK_RETURN(mndAddDecVgroupReplicaFromTrans(pMnode, pTrans, pDb, &movedVg, pSrc->id));

  SSdbRaw *pCommit = mndVgroupActionEncode(&movedVg);
  if (pCommit == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  code = mndTransAppendCommitlog(pTrans, pCommit);
  if (code != 0) {
    // Not appended, so the raw is still ours to free.
    sdbFreeRaw(pCommit);
    TAOS_RETURN(code);
  }

  code = sdbSetRawStatus(pCommit, SDB_STATUS_READY);
  if (code != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", movedVg.vgId, tstrerror(code), __LINE__);
    TAOS_RETURN(code);
  }

  mInfo("vgId:%d, vgroup info after balance, replica:%d", movedVg.vgId, movedVg.replica);
  for (int32_t idx = 0; idx < movedVg.replica; ++idx) {
    mInfo("vgId:%d, vnode:%d dnode:%d", movedVg.vgId, idx, movedVg.vnodeGid[idx].dnodeId);
  }
  TAOS_RETURN(code);
}
3789

3790
static int32_t mndBalanceVgroupBetweenDnode(SMnode *pMnode, STrans *pTrans, SDnodeObj *pSrc, SDnodeObj *pDst,
15,255✔
3791
                                            SHashObj *pBalancedVgroups) {
3792
  void   *pIter = NULL;
15,255✔
3793
  int32_t code = -1;
15,255✔
3794
  SSdb   *pSdb = pMnode->pSdb;
15,255✔
3795

3796
  while (1) {
9,394✔
3797
    SVgObj *pVgroup = NULL;
24,649✔
3798
    pIter = sdbFetch(pSdb, SDB_VGROUP, pIter, (void **)&pVgroup);
24,649✔
3799
    if (pIter == NULL) break;
24,649✔
3800
    if (taosHashGet(pBalancedVgroups, &pVgroup->vgId, sizeof(int32_t)) != NULL) {
24,649✔
3801
      sdbRelease(pSdb, pVgroup);
8,665✔
3802
      continue;
8,665✔
3803
    }
3804

3805
    bool existInSrc = false;
15,984✔
3806
    bool existInDst = false;
15,984✔
3807
    for (int32_t i = 0; i < pVgroup->replica; ++i) {
46,388✔
3808
      SVnodeGid *pGid = &pVgroup->vnodeGid[i];
30,404✔
3809
      if (pGid->dnodeId == pSrc->id) existInSrc = true;
30,404✔
3810
      if (pGid->dnodeId == pDst->id) existInDst = true;
30,404✔
3811
    }
3812

3813
    if (!existInSrc || existInDst) {
15,984✔
3814
      sdbRelease(pSdb, pVgroup);
729✔
3815
      continue;
729✔
3816
    }
3817

3818
    SDbObj *pDb = mndAcquireDb(pMnode, pVgroup->dbName);
15,255✔
3819
    if (pDb == NULL) {
15,255✔
3820
      code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
3821
      if (terrno != 0) code = terrno;
×
3822
      mError("vgId:%d, balance vgroup can't find db obj dbName:%s", pVgroup->vgId, pVgroup->dbName);
×
3823
      goto _OUT;
×
3824
    }
3825

3826
    if (pDb->cfg.withArbitrator) {
15,255✔
3827
      mInfo("vgId:%d, db:%s, with arbitrator, balance vgroup not allowed", pVgroup->vgId, pVgroup->dbName);
×
3828
      goto _OUT;
×
3829
    }
3830

3831
    code = mndSetBalanceVgroupInfoToTrans(pMnode, pTrans, pDb, pVgroup, pSrc, pDst);
15,255✔
3832
    if (code == 0) {
15,255✔
3833
      code = taosHashPut(pBalancedVgroups, &pVgroup->vgId, sizeof(int32_t), &pVgroup->vgId, sizeof(int32_t));
15,255✔
3834
    }
3835

3836
  _OUT:
15,255✔
3837
    mndReleaseDb(pMnode, pDb);
15,255✔
3838
    sdbRelease(pSdb, pVgroup);
15,255✔
3839
    sdbCancelFetch(pSdb, pIter);
15,255✔
3840
    break;
15,255✔
3841
  }
3842

3843
  return code;
15,255✔
3844
}
3845

3846
// Build and prepare a "balance-vgroup" transaction that moves vnodes from the
// most loaded dnode to the least loaded one until no further move helps.
//
// Each round sorts pArray with mndCompareDnodeVnodes, takes the last entry as
// the source and the first as the destination, and compares the scores both
// would have after one move. While the source would still score at least as
// high as the destination, one vgroup is moved and the in-memory vnode
// counters of both dnodes are adjusted.
//
// pArray must hold at least two SDnodeObj entries (the caller checks this).
//
// Returns TSDB_CODE_ACTION_IN_PROGRESS when a transaction was prepared,
// 0 when nothing needed to be moved, otherwise an error code.
static int32_t mndBalanceVgroup(SMnode *pMnode, SRpcMsg *pReq, SArray *pArray) {
  int32_t   code = -1;
  int32_t   numOfVgroups = 0;
  STrans   *pTrans = NULL;
  SHashObj *pBalancedVgroups = NULL;

  // Records the vgroups already queued so each one is moved at most once.
  pBalancedVgroups = taosHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), false, HASH_NO_LOCK);
  if (pBalancedVgroups == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "balance-vgroup");
  if (pTrans == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to balance vgroup", pTrans->id);
  TAOS_CHECK_GOTO(mndTransCheckConflict(pMnode, pTrans), NULL, _OVER);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithCompact(pMnode, pTrans), NULL, _OVER);
  TAOS_CHECK_GOTO(mndTransCheckConflictWithRetention(pMnode, pTrans), NULL, _OVER);

  while (1) {
    taosArraySort(pArray, (__compar_fn_t)mndCompareDnodeVnodes);
    for (int32_t i = 0; i < taosArrayGetSize(pArray); ++i) {
      SDnodeObj *pDnode = taosArrayGet(pArray, i);
      mInfo("dnode:%d, equivalent vnodes:%d others:%d support:%d, score:%f", pDnode->id, pDnode->numOfVnodes,
            pDnode->numOfOtherNodes, pDnode->numOfSupportVnodes, mndGetDnodeScore(pDnode, 0, 1));
    }

    SDnodeObj *pSrc = taosArrayGet(pArray, taosArrayGetSize(pArray) - 1);
    SDnodeObj *pDst = taosArrayGet(pArray, 0);

    // Scores as they would be after moving one vnode from pSrc to pDst.
    float srcScore = mndGetDnodeScore(pSrc, -1, 1);
    float dstScore = mndGetDnodeScore(pDst, 1, 1);
    mInfo("trans:%d, after balance, src dnode:%d score:%f, dst dnode:%d score:%f", pTrans->id, pSrc->id, srcScore,
          pDst->id, dstScore);

    // The small epsilon lets scores that are equal up to rounding still count as worth moving.
    if (srcScore > dstScore - 0.000001) {
      code = mndBalanceVgroupBetweenDnode(pMnode, pTrans, pSrc, pDst, pBalancedVgroups);
      if (code == 0) {
        pSrc->numOfVnodes--;
        pDst->numOfVnodes++;
        numOfVgroups++;
        continue;
      } else {
        mInfo("trans:%d, no vgroup need to balance from dnode:%d to dnode:%d", pTrans->id, pSrc->id, pDst->id);
        break;
      }
    } else {
      mInfo("trans:%d, no vgroup need to balance any more", pTrans->id);
      break;
    }
  }

  if (numOfVgroups <= 0) {
    mInfo("no need to balance vgroup");
    code = 0;
  } else {
    mInfo("start to balance vgroup, numOfVgroups:%d", numOfVgroups);
    // Keep the prepare error: code may still be 0 from the last successful move.
    if ((code = mndTransPrepare(pMnode, pTrans)) != 0) goto _OVER;
    code = TSDB_CODE_ACTION_IN_PROGRESS;
  }

_OVER:
  taosHashCleanup(pBalancedVgroups);
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
3914

3915
// Handle a balance-vgroup request.
//
// Steps: deserialize the request, check the MND_OPER_BALANCE_VGROUP
// privilege, refuse when any mount exists or any dnode is offline, build the
// dnode array and, when it holds at least two dnodes, run mndBalanceVgroup.
// An audit record is written whenever the dnode array was built, whatever the
// balance result.
//
// Returns 0 when nothing had to be done, TSDB_CODE_ACTION_IN_PROGRESS when a
// transaction was started, otherwise an error code.
static int32_t mndProcessBalanceVgroupMsg(SRpcMsg *pReq) {
  SMnode *pMnode = pReq->info.node;
  int32_t code = -1;
  SArray *pArray = NULL;
  void   *pIter = NULL;
  int64_t curMs = taosGetTimestampMs();

  SBalanceVgroupReq req = {0};
  if (tDeserializeSBalanceVgroupReq(pReq->pCont, pReq->contLen, &req) != 0) {
    code = TSDB_CODE_INVALID_MSG;
    goto _OVER;
  }

  mInfo("start to balance vgroup");
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_BALANCE_VGROUP)) != 0) {
    goto _OVER;
  }

  if (sdbGetSize(pMnode->pSdb, SDB_MOUNT) > 0) {
    code = TSDB_CODE_MND_MOUNT_NOT_EMPTY;
    goto _OVER;
  }

  // Every dnode must be online before anything is moved.
  while (1) {
    SDnodeObj *pDnode = NULL;
    pIter = sdbFetch(pMnode->pSdb, SDB_DNODE, pIter, (void **)&pDnode);
    if (pIter == NULL) break;
    if (!mndIsDnodeOnline(pDnode, curMs)) {
      sdbCancelFetch(pMnode->pSdb, pIter);
      code = TSDB_CODE_MND_HAS_OFFLINE_DNODE;
      // Report the code chosen above; terrno has not been set on this path.
      mError("failed to balance vgroup since %s, dnode:%d", tstrerror(code), pDnode->id);
      sdbRelease(pMnode->pSdb, pDnode);
      goto _OVER;
    }

    sdbRelease(pMnode->pSdb, pDnode);
  }

  pArray = mndBuildDnodesArray(pMnode, 0, NULL);
  if (pArray == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  if (taosArrayGetSize(pArray) < 2) {
    mInfo("no need to balance vgroup since dnode num less than 2");
    code = 0;
  } else {
    code = mndBalanceVgroup(pMnode, pReq, pArray);
  }

  auditRecord(pReq, pMnode->clusterId, "balanceVgroup", "", "", req.sql, req.sqlLen);

_OVER:
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
    mError("failed to balance vgroup since %s", tstrerror(code));
  }

  taosArrayDestroy(pArray);
  tFreeSBalanceVgroupReq(&req);
  TAOS_RETURN(code);
}
3978

3979
// True when pVgroup is not flagged isTsma and its dbUid equals dbUid.
bool mndVgroupInDb(SVgObj *pVgroup, int64_t dbUid) {
  if (pVgroup->isTsma) return false;
  return pVgroup->dbUid == dbUid;
}
95,585,819✔
3980

3981
// True when one of the first `replica` vnodes of pVgroup is placed on dnodeId.
bool mndVgroupInDnode(SVgObj *pVgroup, int32_t dnodeId) {
  bool found = false;
  // Stop scanning as soon as a match is seen.
  for (int idx = 0; !found && idx < pVgroup->replica; idx++) {
    found = (pVgroup->vnodeGid[idx].dnodeId == dnodeId);
  }
  return found;
}
3987

3988
static void *mndBuildCompactVnodeReq(SMnode *pMnode, SDbObj *pDb, SVgObj *pVgroup, int32_t *pContLen, int64_t compactTs,
132,575✔
3989
                                     STimeWindow tw, bool metaOnly, bool force, ETsdbOpType type,
3990
                                     ETriggerType triggerType) {
3991
  SCompactVnodeReq compactReq = {0};
132,575✔
3992
  compactReq.dbUid = pDb->uid;
132,575✔
3993
  compactReq.compactStartTime = compactTs;
132,575✔
3994
  compactReq.tw = tw;
132,575✔
3995
  compactReq.metaOnly = metaOnly;
132,575✔
3996
  compactReq.force = force;
132,575✔
3997
  compactReq.optrType = type;
132,575✔
3998
  compactReq.triggerType = triggerType;
132,575✔
3999
  tstrncpy(compactReq.db, pDb->name, TSDB_DB_FNAME_LEN);
132,575✔
4000

4001
  mInfo("vgId:%d, build compact vnode config req", pVgroup->vgId);
132,575✔
4002
  int32_t contLen = tSerializeSCompactVnodeReq(NULL, 0, &compactReq);
132,575✔
4003
  if (contLen < 0) {
132,575✔
4004
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
4005
    return NULL;
×
4006
  }
4007
  contLen += sizeof(SMsgHead);
132,575✔
4008

4009
  void *pReq = taosMemoryMalloc(contLen);
132,575✔
4010
  if (pReq == NULL) {
132,575✔
4011
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
4012
    return NULL;
×
4013
  }
4014

4015
  SMsgHead *pHead = pReq;
132,575✔
4016
  pHead->contLen = htonl(contLen);
132,575✔
4017
  pHead->vgId = htonl(pVgroup->vgId);
132,575✔
4018

4019
  if (tSerializeSCompactVnodeReq((char *)pReq + sizeof(SMsgHead), contLen, &compactReq) < 0) {
132,575✔
4020
    taosMemoryFree(pReq);
×
4021
    terrno = TSDB_CODE_OUT_OF_MEMORY;
×
4022
    return NULL;
×
4023
  }
4024
  *pContLen = contLen;
132,575✔
4025
  return pReq;
132,575✔
4026
}
4027

4028
static int32_t mndAddCompactVnodeAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t compactTs,
67,184✔
4029
                                        STimeWindow tw, bool metaOnly, bool force, ETsdbOpType type,
4030
                                        ETriggerType triggerType) {
4031
  int32_t      code = 0;
67,184✔
4032
  STransAction action = {0};
67,184✔
4033
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);
67,184✔
4034

4035
  int32_t contLen = 0;
67,184✔
4036
  void   *pReq =
4037
      mndBuildCompactVnodeReq(pMnode, pDb, pVgroup, &contLen, compactTs, tw, metaOnly, force, type, triggerType);
67,184✔
4038
  if (pReq == NULL) {
67,184✔
4039
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
4040
    if (terrno != 0) code = terrno;
×
4041
    TAOS_RETURN(code);
×
4042
  }
4043

4044
  action.pCont = pReq;
67,184✔
4045
  action.contLen = contLen;
67,184✔
4046
  action.msgType = TDMT_VND_COMPACT;
67,184✔
4047

4048
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
67,184✔
4049
    taosMemoryFree(pReq);
×
4050
    TAOS_RETURN(code);
×
4051
  }
4052

4053
  TAOS_RETURN(code);
67,184✔
4054
}
4055

4056
int32_t mndBuildCompactVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t compactTs,
67,184✔
4057
                                    STimeWindow tw, bool metaOnly, bool force, ETsdbOpType type,
4058
                                    ETriggerType triggerType) {
4059
  TAOS_CHECK_RETURN(
67,184✔
4060
      mndAddCompactVnodeAction(pMnode, pTrans, pDb, pVgroup, compactTs, tw, metaOnly, force, type, triggerType));
4061
  return 0;
67,184✔
4062
}
4063

4064
int32_t mndBuildTrimVgroupAction(SMnode *pMnode, STrans *pTrans, SDbObj *pDb, SVgObj *pVgroup, int64_t startTs,
65,391✔
4065
                                 STimeWindow tw, ETsdbOpType type, ETriggerType triggerType) {
4066
  int32_t      code = 0;
65,391✔
4067
  STransAction action = {0};
65,391✔
4068
  action.epSet = mndGetVgroupEpset(pMnode, pVgroup);
65,391✔
4069

4070
  int32_t contLen = 0;
65,391✔
4071
  // reuse SCompactVnodeReq as SVTrimDbReq
4072
  void *pReq = mndBuildCompactVnodeReq(pMnode, pDb, pVgroup, &contLen, startTs, tw, false, false, type, triggerType);
65,391✔
4073
  if (pReq == NULL) {
65,391✔
4074
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
×
4075
    if (terrno != 0) code = terrno;
×
4076
    TAOS_RETURN(code);
×
4077
  }
4078

4079
  action.pCont = pReq;
65,391✔
4080
  action.contLen = contLen;
65,391✔
4081
  action.msgType = TDMT_VND_TRIM;
65,391✔
4082

4083
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
65,391✔
4084
    taosMemoryFree(pReq);
×
4085
    TAOS_RETURN(code);
×
4086
  }
4087

4088
  TAOS_RETURN(code);
65,391✔
4089
}
4090

4091
// Handle a set-vgroup-keep-version request.
//
// Creates a "set-vgroup-keep-version" transaction that
//   - appends to the commit log a copy of the vgroup carrying the new
//     keepVersion and the current time as keepVersionTime, and
//   - adds one TDMT_VND_SET_KEEP_VERSION redo action per replica, addressed
//     to the dnode hosting that replica (TSDB_CODE_VND_STOPPED is accepted).
//
// Returns TSDB_CODE_ACTION_IN_PROGRESS once the transaction is prepared,
// otherwise an error code.
static int32_t mndProcessSetVgroupKeepVersionReq(SRpcMsg *pReq) {
  SMnode  *pMnode = pReq->info.node;
  int32_t  code = TSDB_CODE_SUCCESS;
  STrans  *pTrans = NULL;
  SVgObj  *pVgroup = NULL;
  SSdbRaw *pCommitRaw = NULL;  // non-NULL only while this function still has to free it

  SMndSetVgroupKeepVersionReq req = {0};
  if (tDeserializeSMndSetVgroupKeepVersionReq(pReq->pCont, pReq->contLen, &req) != 0) {
    code = TSDB_CODE_INVALID_MSG;
    goto _OVER;
  }

  mInfo("start to set vgroup keep version, vgId:%d, keepVersion:%" PRId64, req.vgId, req.keepVersion);

  // Check permission
  if ((code = mndCheckOperPrivilege(pMnode, pReq->info.conn.user, MND_OPER_WRITE_DB)) != 0) {
    goto _OVER;
  }

  // Get vgroup
  pVgroup = mndAcquireVgroup(pMnode, req.vgId);
  if (pVgroup == NULL) {
    code = TSDB_CODE_MND_VGROUP_NOT_EXIST;
    mError("vgId:%d not exist, failed to set keep version", req.vgId);
    goto _OVER;
  }

  // Create transaction
  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_NOTHING, pReq, "set-vgroup-keep-version");
  if (pTrans == NULL) {
    code = terrno != 0 ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto _OVER;
  }

  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to set vgroup keep version, vgId:%d keepVersion:%" PRId64, pTrans->id, req.vgId,
        req.keepVersion);

  // Update SVgObj's keepVersion in mnode (on a copy; the sdb object is only read)
  SVgObj newVgroup = {0};
  memcpy(&newVgroup, pVgroup, sizeof(SVgObj));
  newVgroup.keepVersion = req.keepVersion;
  newVgroup.keepVersionTime = taosGetTimestampMs();

  // Add the updated vgroup to the transaction's commit log
  pCommitRaw = mndVgroupActionEncode(&newVgroup);
  if (pCommitRaw == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _OVER;
  }
  // Set the status before appending so that every failure path frees a raw
  // that only this function references.
  if ((code = sdbSetRawStatus(pCommitRaw, SDB_STATUS_READY)) != 0) {
    mError("vgId:%d, failed to set raw status to ready, error:%s, line:%d", pVgroup->vgId, tstrerror(code), __LINE__);
    goto _OVER;
  }
  if ((code = mndTransAppendCommitlog(pTrans, pCommitRaw)) != 0) {
    goto _OVER;
  }
  // Appended successfully: the raw must no longer be freed here.
  pCommitRaw = NULL;

  // Prepare message for vnodes
  SVndSetKeepVersionReq vndReq = {.keepVersion = req.keepVersion};
  int32_t               reqLen = tSerializeSVndSetKeepVersionReq(NULL, 0, &vndReq);
  if (reqLen < 0) {
    // A negative length would otherwise flow into the allocation size below.
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _OVER;
  }
  int32_t contLen = reqLen + (int32_t)sizeof(SMsgHead);

  // Send to all replicas of the vgroup
  for (int32_t i = 0; i < pVgroup->replica; ++i) {
    SMsgHead *pHead = taosMemoryMalloc(contLen);
    if (pHead == NULL) {
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _OVER;
    }

    pHead->contLen = htonl(contLen);
    pHead->vgId = htonl(pVgroup->vgId);

    if (tSerializeSVndSetKeepVersionReq((char *)pHead + sizeof(SMsgHead), reqLen, &vndReq) < 0) {
      taosMemoryFree(pHead);
      code = TSDB_CODE_OUT_OF_MEMORY;
      goto _OVER;
    }

    // Get dnode and add action to transaction
    SDnodeObj *pDnode = mndAcquireDnode(pMnode, pVgroup->vnodeGid[i].dnodeId);
    if (pDnode == NULL) {
      taosMemoryFree(pHead);
      code = TSDB_CODE_MND_DNODE_NOT_EXIST;
      goto _OVER;
    }

    STransAction action = {0};
    action.epSet = mndGetDnodeEpset(pDnode);
    mndReleaseDnode(pMnode, pDnode);
    action.pCont = pHead;
    action.contLen = contLen;
    action.msgType = TDMT_VND_SET_KEEP_VERSION;
    action.acceptableCode = TSDB_CODE_VND_STOPPED;

    // Use the returned code rather than terrno, so a failure can never be reported as 0.
    if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
      taosMemoryFree(pHead);
      goto _OVER;
    }
  }

  // The vgroup is not needed past this point; release it before preparing.
  mndReleaseVgroup(pMnode, pVgroup);
  pVgroup = NULL;

  // Prepare and execute transaction
  if ((code = mndTransPrepare(pMnode, pTrans)) != 0) {
    goto _OVER;
  }

  code = TSDB_CODE_ACTION_IN_PROGRESS;

_OVER:
  // Single cleanup point for everything still held on exit.
  sdbFreeRaw(pCommitRaw);
  if (pVgroup != NULL) mndReleaseVgroup(pMnode, pVgroup);
  if (pTrans != NULL) mndTransDrop(pTrans);

  return code;
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc