• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #5005

26 Mar 2026 12:51PM UTC coverage: 72.152% (-0.2%) from 72.338%
#5005

push

travis-ci

web-flow
merge: from main to 3.0 branch #34951

512 of 851 new or added lines in 47 files covered. (60.16%)

6189 existing lines in 147 files now uncovered.

253282 of 351039 relevant lines covered (72.15%)

132156710.33 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

78.57
/source/dnode/mnode/impl/src/mndMnode.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
#include "audit.h"
18
#include "mndCluster.h"
19
#include "mndDnode.h"
20
#include "mndMnode.h"
21
#include "mndPrivilege.h"
22
#include "mndShow.h"
23
#include "mndSync.h"
24
#include "mndTrans.h"
25
#include "tmisce.h"
26

27
#define MNODE_VER_NUMBER   2
28
#define MNODE_RESERVE_SIZE 64
29

30
static int32_t  mndCreateDefaultMnode(SMnode *pMnode);
31
static SSdbRaw *mndMnodeActionEncode(SMnodeObj *pObj);
32
static SSdbRow *mndMnodeActionDecode(SSdbRaw *pRaw);
33
static int32_t  mndMnodeActionInsert(SSdb *pSdb, SMnodeObj *pObj);
34
static int32_t  mndMnodeActionDelete(SSdb *pSdb, SMnodeObj *pObj);
35
static int32_t  mndMnodeActionUpdate(SSdb *pSdb, SMnodeObj *pOld, SMnodeObj *pNew);
36
static int32_t  mndProcessCreateMnodeReq(SRpcMsg *pReq);
37
static int32_t  mndProcessAlterMnodeReq(SRpcMsg *pReq);
38
static int32_t  mndProcessDropMnodeReq(SRpcMsg *pReq);
39
static int32_t  mndRetrieveMnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows);
40
static void     mndCancelGetNextMnode(SMnode *pMnode, void *pIter);
41
static void     mndReloadSyncConfig(SMnode *pMnode);
42

43
/*
 * Install the mnode message handlers and show handlers, then register the
 * SDB_MNODE table callbacks with sdb.
 *
 * Returns whatever sdbSetTable() returns.
 */
int32_t mndInitMnode(SMnode *pMnode) {
  // Requests are processed by this file; every *_RSP message is routed to the
  // transaction response handler.
  mndSetMsgHandle(pMnode, TDMT_MND_CREATE_MNODE, mndProcessCreateMnodeReq);
  mndSetMsgHandle(pMnode, TDMT_DND_CREATE_MNODE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_DND_ALTER_MNODE_TYPE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_MND_ALTER_MNODE, mndProcessAlterMnodeReq);
  mndSetMsgHandle(pMnode, TDMT_MND_ALTER_MNODE_RSP, mndTransProcessRsp);
  mndSetMsgHandle(pMnode, TDMT_MND_DROP_MNODE, mndProcessDropMnodeReq);
  mndSetMsgHandle(pMnode, TDMT_DND_DROP_MNODE_RSP, mndTransProcessRsp);

  // Handlers backing the mnode management table.
  mndAddShowRetrieveHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndRetrieveMnodes);
  mndAddShowFreeIterHandle(pMnode, TSDB_MGMT_TABLE_MNODE, mndCancelGetNextMnode);

  // sdb callbacks for rows of type SDB_MNODE, keyed by an int32 id.
  SSdbTable mnodeTable = {
      .sdbType = SDB_MNODE,
      .keyType = SDB_KEY_INT32,
      .deployFp = (SdbDeployFp)mndCreateDefaultMnode,
      .encodeFp = (SdbEncodeFp)mndMnodeActionEncode,
      .decodeFp = (SdbDecodeFp)mndMnodeActionDecode,
      .insertFp = (SdbInsertFp)mndMnodeActionInsert,
      .updateFp = (SdbUpdateFp)mndMnodeActionUpdate,
      .deleteFp = (SdbDeleteFp)mndMnodeActionDelete,
  };

  return sdbSetTable(pMnode->pSdb, mnodeTable);
}
68

69
/* Counterpart of mndInitMnode(); currently there is nothing to tear down. */
void mndCleanupMnode(SMnode *pMnode) {
  (void)pMnode;
}
453,182✔
70

71
/*
 * Acquire the mnode row with the given id from sdb.
 *
 * terrno is cleared before the lookup. When the lookup fails with
 * TSDB_CODE_SDB_OBJ_NOT_THERE, terrno is rewritten to
 * TSDB_CODE_MND_MNODE_NOT_EXIST; any other terrno value is left untouched.
 *
 * Returns the acquired object, or NULL when sdbAcquire() returned NULL.
 */
SMnodeObj *mndAcquireMnode(SMnode *pMnode, int32_t mnodeId) {
  terrno = 0;

  SMnodeObj *pFound = sdbAcquire(pMnode->pSdb, SDB_MNODE, &mnodeId);
  if (pFound != NULL) {
    return pFound;
  }

  if (terrno == TSDB_CODE_SDB_OBJ_NOT_THERE) {
    terrno = TSDB_CODE_MND_MNODE_NOT_EXIST;
  }
  return NULL;
}
79

80
/*
 * Hand an mnode object back to sdb via sdbRelease().
 *
 * pObj is forwarded unchanged, including when it is NULL.
 */
void mndReleaseMnode(SMnode *pMnode, SMnodeObj *pObj) {
  sdbRelease(pMnode->pSdb, pObj);
}
29,329,476✔
84

85
/*
 * Deploy callback for the mnode table: builds the row for mnode 1 and commits
 * it through a "create-mnode" transaction.
 *
 * Returns 0 on success. On failure the specific error code is returned (and
 * stored in terrno through TAOS_RETURN) instead of a bare -1, so the value is
 * still non-zero for callers that only test for failure.
 */
static int32_t mndCreateDefaultMnode(SMnode *pMnode) {
  int32_t   code = 0;
  STrans   *pTrans = NULL;
  SMnodeObj mnodeObj = {0};
  mnodeObj.id = 1;
  mnodeObj.createdTime = taosGetTimestampMs();
  mnodeObj.updateTime = mnodeObj.createdTime;

  SSdbRaw *pRaw = mndMnodeActionEncode(&mnodeObj);
  if (pRaw == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  if ((code = sdbSetRawStatus(pRaw, SDB_STATUS_READY)) != 0) {
    // The raw has not been attached to any transaction yet, so free it here.
    sdbFreeRaw(pRaw);
    TAOS_RETURN(code);
  }

  mInfo("mnode:%d, will be created when deploying, raw:%p", mnodeObj.id, pRaw);

  pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, NULL, "create-mnode");
  if (pTrans == NULL) {
    // Capture the failure reason before cleanup/logging can disturb terrno.
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    sdbFreeRaw(pRaw);
    mError("mnode:%d, failed to create since %s", mnodeObj.id, terrstr());
    TAOS_RETURN(code);
  }
  mInfo("trans:%d, used to create mnode:%d", pTrans->id, mnodeObj.id);

  if ((code = mndTransAppendCommitlog(pTrans, pRaw)) != 0) {
    // NOTE(review): ownership of pRaw after a failed append is not visible
    // from this file, so it is deliberately not freed here — confirm.
    mError("trans:%d, failed to append commit log since %s", pTrans->id, terrstr());
    goto _OVER;
  }

  // From here on every exit must drop the transaction.
  if ((code = sdbSetRawStatus(pRaw, SDB_STATUS_READY)) != 0) {
    goto _OVER;
  }

  if ((code = mndTransPrepare(pMnode, pTrans)) != 0) {
    mError("trans:%d, failed to prepare since %s", pTrans->id, terrstr());
    goto _OVER;
  }

_OVER:
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
128

129
/*
 * Serialize an SMnodeObj into a newly allocated sdb raw record of version
 * MNODE_VER_NUMBER.
 *
 * Field order: id, createdTime, updateTime, role, lastIndex, followed by
 * MNODE_RESERVE_SIZE reserved bytes.
 *
 * Returns the raw record with terrno == 0, or NULL with terrno left non-zero.
 */
static SSdbRaw *mndMnodeActionEncode(SMnodeObj *pObj) {
  // code/lino are not used directly below; presumably the SDB_SET_* macros
  // reference them (macro bodies are not visible here), so they stay.
  int32_t code = 0;
  int32_t lino = 0;
  int32_t dataPos = 0;

  // Pessimistic default: stays in place unless the whole record is written.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  SSdbRaw *pRaw = sdbAllocRaw(SDB_MNODE, MNODE_VER_NUMBER, sizeof(SMnodeObj) + MNODE_RESERVE_SIZE);
  if (pRaw == NULL) goto _OVER;

  SDB_SET_INT32(pRaw, dataPos, pObj->id, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pObj->createdTime, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pObj->updateTime, _OVER)
  SDB_SET_INT32(pRaw, dataPos, pObj->role, _OVER)
  SDB_SET_INT64(pRaw, dataPos, pObj->lastIndex, _OVER)
  SDB_SET_RESERVE(pRaw, dataPos, MNODE_RESERVE_SIZE, _OVER)

  terrno = 0;

_OVER:
  if (terrno == 0) {
    mTrace("mnode:%d, encode to raw:%p, row:%p", pObj->id, pRaw, pObj);
    return pRaw;
  }

  mError("mnode:%d, failed to encode to raw:%p since %s", pObj->id, pRaw, terrstr());
  sdbFreeRaw(pRaw);
  return NULL;
}
157

158
/*
 * Rebuild an SMnodeObj row from an sdb raw record.
 *
 * Soft versions 1 and 2 are accepted. role and lastIndex are only read for
 * version >= 2; for version 1 they keep whatever sdbAllocRow() provided.
 *
 * Returns the new row with terrno == 0, or NULL on failure.
 */
static SSdbRow *mndMnodeActionDecode(SSdbRaw *pRaw) {
  // code/lino are not used directly below; presumably the SDB_GET_* macros
  // reference them (macro bodies are not visible here), so they stay.
  int32_t    code = 0;
  int32_t    lino = 0;
  int32_t    dataPos = 0;
  int8_t     sver = 0;
  SSdbRow   *pRow = NULL;
  SMnodeObj *pObj = NULL;

  // Pessimistic default: stays in place unless decoding runs to completion.
  terrno = TSDB_CODE_OUT_OF_MEMORY;

  if (sdbGetRawSoftVer(pRaw, &sver) != 0) return NULL;

  if (!(sver == 1 || sver == 2)) {
    terrno = TSDB_CODE_SDB_INVALID_DATA_VER;
    goto _OVER;
  }

  pRow = sdbAllocRow(sizeof(SMnodeObj));
  if (pRow == NULL) goto _OVER;

  pObj = sdbGetRowObj(pRow);
  if (pObj == NULL) goto _OVER;

  SDB_GET_INT32(pRaw, dataPos, &pObj->id, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pObj->createdTime, _OVER)
  SDB_GET_INT64(pRaw, dataPos, &pObj->updateTime, _OVER)
  if (sver >= 2) {
    SDB_GET_INT32(pRaw, dataPos, &pObj->role, _OVER)
    SDB_GET_INT64(pRaw, dataPos, &pObj->lastIndex, _OVER)
  }
  SDB_GET_RESERVE(pRaw, dataPos, MNODE_RESERVE_SIZE, _OVER)

  terrno = 0;

_OVER:
  if (terrno == 0) {
    mTrace("mnode:%d, decode from raw:%p, row:%p", pObj->id, pRaw, pObj);
    return pRow;
  }

  mError("mnode:%d, failed to decode from raw:%p since %s", pObj == NULL ? 0 : pObj->id, pRaw, terrstr());
  taosMemoryFreeClear(pRow);
  return NULL;
}
201

202
/*
 * sdb insert callback for an mnode row.
 *
 * Binds the row to the dnode with the same id (acquired even when that dnode
 * is not in ready state), marks the mnode offline and reloads the sync
 * configuration.
 *
 * Returns 0 on success. When the dnode cannot be acquired, the error code
 * (terrno if set, otherwise TSDB_CODE_MND_RETURN_VALUE_NULL) is returned after
 * the sync state and sync config have still been updated, exactly as before.
 */
static int32_t mndMnodeActionInsert(SSdb *pSdb, SMnodeObj *pObj) {
  int32_t code = 0;
  mTrace("mnode:%d, perform insert action, row:%p", pObj->id, pObj);

  pObj->pDnode = sdbAcquireNotReadyObj(pSdb, SDB_DNODE, &pObj->id);
  if (pObj->pDnode == NULL) {
    mError("mnode:%d, failed to perform insert action since %s", pObj->id, terrstr());
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    // NOTE(review): a dead, shadowing `int32_t code = 0;` used to sit here and
    // looks like a leftover from an early return — confirm whether this branch
    // should return before touching the sync configuration.
  }

  pObj->syncState = TAOS_SYNC_STATE_OFFLINE;
  mndReloadSyncConfig(pSdb->pMnode);
  TAOS_RETURN(code);
}
217

218
/*
 * sdb delete callback for an mnode row: releases the dnode reference held by
 * the row, if any, and clears the pointer. Always returns 0.
 */
static int32_t mndMnodeActionDelete(SSdb *pSdb, SMnodeObj *pObj) {
  mTrace("mnode:%d, perform delete action, row:%p", pObj->id, pObj);

  if (pObj->pDnode == NULL) {
    return 0;
  }

  sdbRelease(pSdb, pObj->pDnode);
  pObj->pDnode = NULL;
  return 0;
}
227

228
/*
 * sdb update callback for an mnode row: copies updateTime, role and lastIndex
 * from the new row into the existing one, then reloads the sync configuration.
 * Always returns 0.
 */
static int32_t mndMnodeActionUpdate(SSdb *pSdb, SMnodeObj *pOld, SMnodeObj *pNew) {
  mTrace("mnode:%d, perform update action, old row:%p new row:%p", pOld->id, pOld, pNew);

  // Only these three fields are carried over; everything else stays as in pOld.
  pOld->updateTime = pNew->updateTime;
  pOld->lastIndex = pNew->lastIndex;
  pOld->role = pNew->role;

  mndReloadSyncConfig(pSdb->pMnode);
  return 0;
}
237

238
/*
 * Report whether an mnode row keyed by dnodeId can be acquired from sdb.
 * The row is released again immediately; only its existence matters.
 */
bool mndIsMnode(SMnode *pMnode, int32_t dnodeId) {
  SSdb      *pSdb = pMnode->pSdb;
  SMnodeObj *pFound = sdbAcquire(pSdb, SDB_MNODE, &dnodeId);
  bool       found = (pFound != NULL);

  if (found) {
    sdbRelease(pSdb, pFound);
  }
  return found;
}
249

250
/*
 * Populate pEpSet by delegating to syncGetRetryEpSet() on this mnode's sync
 * handle. Does nothing when either argument is NULL.
 */
void mndGetMnodeEpSet(SMnode *pMnode, SEpSet *pEpSet) {
  if (pMnode != NULL && pEpSet != NULL) {
    syncGetRetryEpSet(pMnode->syncMgmt.sync, pEpSet);
  }
}
297

298
/*
 * Encode pObj and append it to pTrans as a redo log, then mark the raw record
 * SDB_STATUS_CREATING.
 *
 * Returns 0 on success; on encode failure returns terrno if set, otherwise
 * TSDB_CODE_MND_RETURN_VALUE_NULL; otherwise the first failing step's code.
 */
static int32_t mndSetCreateMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);
  if (pRaw == NULL) {
    int32_t failCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(failCode);
  }

  TAOS_CHECK_RETURN(mndTransAppendRedolog(pTrans, pRaw));
  TAOS_CHECK_RETURN(sdbSetRawStatus(pRaw, SDB_STATUS_CREATING));
  TAOS_RETURN(0);
}
310

311
/*
 * Encode pObj and append it to pTrans as a redo log, then mark the raw record
 * SDB_STATUS_READY (the restore variant of the create redo log).
 *
 * Returns 0 on success; on encode failure returns terrno if set, otherwise
 * TSDB_CODE_MND_RETURN_VALUE_NULL; otherwise the first failing step's code.
 */
int32_t mndSetRestoreCreateMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);
  if (pRaw == NULL) {
    int32_t failCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(failCode);
  }

  TAOS_CHECK_RETURN(mndTransAppendRedolog(pTrans, pRaw));
  TAOS_CHECK_RETURN(sdbSetRawStatus(pRaw, SDB_STATUS_READY));
  TAOS_RETURN(0);
}
323

324
/*
 * Encode pObj and append it to pTrans as an undo log, then mark the raw record
 * SDB_STATUS_DROPPED.
 *
 * Returns 0 on success; on encode failure returns terrno if set, otherwise
 * TSDB_CODE_MND_RETURN_VALUE_NULL; otherwise the first failing step's code.
 */
static int32_t mndSetCreateMnodeUndoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);
  if (pRaw == NULL) {
    int32_t failCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(failCode);
  }

  TAOS_CHECK_RETURN(mndTransAppendUndolog(pTrans, pRaw));
  TAOS_CHECK_RETURN(sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED));
  TAOS_RETURN(0);
}
336

337
/*
 * Encode pObj and append it to pTrans as a commit log, then mark the raw
 * record SDB_STATUS_READY.
 *
 * Returns 0 on success; on encode failure returns terrno if set, otherwise
 * TSDB_CODE_MND_RETURN_VALUE_NULL; otherwise the first failing step's code.
 */
int32_t mndSetCreateMnodeCommitLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);
  if (pRaw == NULL) {
    int32_t failCode = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(failCode);
  }

  TAOS_CHECK_RETURN(mndTransAppendCommitlog(pTrans, pRaw));
  TAOS_CHECK_RETURN(sdbSetRawStatus(pRaw, SDB_STATUS_READY));
  TAOS_RETURN(0);
}
349

350
/*
 * Serialize pCreateReq and append it to pTrans as a TDMT_DND_CREATE_MNODE redo
 * action addressed to pCreateEpSet.
 *
 * The serialized buffer is freed here on every failure path; after a
 * successful append it is no longer freed by this function.
 *
 * Returns 0 on success, or the failing step's error code.
 */
static int32_t mndBuildCreateMnodeRedoAction(STrans *pTrans, SDCreateMnodeReq *pCreateReq, SEpSet *pCreateEpSet) {
  int32_t code = 0;

  // First pass only computes the required buffer length.
  int32_t contLen = tSerializeSDCreateMnodeReq(NULL, 0, pCreateReq);
  if (contLen < 0) {
    // A negative result is an error code; never feed it to the allocator.
    TAOS_RETURN(contLen);
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    code = terrno;
    return code;
  }

  code = tSerializeSDCreateMnodeReq(pReq, contLen, pCreateReq);
  if (code < 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  STransAction action = {
      .epSet = *pCreateEpSet,
      .pCont = pReq,
      .contLen = contLen,
      .msgType = TDMT_DND_CREATE_MNODE,
      .acceptableCode = TSDB_CODE_MNODE_ALREADY_DEPLOYED,
      .groupId = -1,
  };

  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }
  TAOS_RETURN(code);
}
379

380
static int32_t mndBuildAlterMnodeTypeRedoAction(STrans *pTrans, SDAlterMnodeTypeReq *pAlterMnodeTypeReq,
15,328✔
381
                                                SEpSet *pAlterMnodeTypeEpSet) {
382
  int32_t code = 0;
15,328✔
383
  int32_t contLen = tSerializeSDCreateMnodeReq(NULL, 0, pAlterMnodeTypeReq);
15,328✔
384
  void   *pReq = taosMemoryMalloc(contLen);
15,328✔
385
  if (pReq == NULL) {
15,328✔
386
    code = terrno;
×
387
    return code;
×
388
  }
389
  code = tSerializeSDCreateMnodeReq(pReq, contLen, pAlterMnodeTypeReq);
15,328✔
390
  if (code < 0) {
15,328✔
391
    taosMemoryFree(pReq);
×
392
    TAOS_RETURN(code);
×
393
  }
394

395
  STransAction action = {
15,328✔
396
      .epSet = *pAlterMnodeTypeEpSet,
397
      .pCont = pReq,
398
      .contLen = contLen,
399
      .msgType = TDMT_DND_ALTER_MNODE_TYPE,
400
      .retryCode = TSDB_CODE_MNODE_NOT_CATCH_UP,
401
      .acceptableCode = TSDB_CODE_MNODE_ALREADY_IS_VOTER,
402
      .groupId = -1,
403
  };
404

405
  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
15,328✔
406
    taosMemoryFree(pReq);
×
407
    TAOS_RETURN(code);
×
408
  }
409
  TAOS_RETURN(code);
15,328✔
410
}
411

412
/*
 * Serialize pAlterReq and append it to pTrans as a TDMT_MND_ALTER_MNODE redo
 * action addressed to pAlterEpSet.
 *
 * The serialized buffer is freed here on every failure path; after a
 * successful append it is no longer freed by this function.
 *
 * Returns 0 on success, or the failing step's error code.
 */
static int32_t mndBuildAlterMnodeRedoAction(STrans *pTrans, SDCreateMnodeReq *pAlterReq, SEpSet *pAlterEpSet) {
  int32_t code = 0;

  // First pass only computes the required buffer length.
  int32_t contLen = tSerializeSDCreateMnodeReq(NULL, 0, pAlterReq);
  if (contLen < 0) {
    // A negative result is an error code; never feed it to the allocator.
    TAOS_RETURN(contLen);
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    code = terrno;
    return code;
  }

  code = tSerializeSDCreateMnodeReq(pReq, contLen, pAlterReq);
  if (code < 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  STransAction action = {
      .epSet = *pAlterEpSet,
      .pCont = pReq,
      .contLen = contLen,
      .msgType = TDMT_MND_ALTER_MNODE,
      .acceptableCode = 0,
  };

  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  TAOS_RETURN(code);
}
440

441
/*
 * Serialize pDropReq and append it to pTrans as a TDMT_DND_DROP_MNODE redo
 * action addressed to pDroprEpSet.
 *
 * The serialized buffer is freed here on every failure path; after a
 * successful append it is no longer freed by this function.
 *
 * Returns 0 on success, or the failing step's error code.
 */
static int32_t mndBuildDropMnodeRedoAction(STrans *pTrans, SDDropMnodeReq *pDropReq, SEpSet *pDroprEpSet) {
  int32_t code = 0;

  // First pass only computes the required buffer length.
  int32_t contLen = tSerializeSCreateDropMQSNodeReq(NULL, 0, pDropReq);
  if (contLen < 0) {
    // A negative result is an error code; never feed it to the allocator.
    TAOS_RETURN(contLen);
  }

  void *pReq = taosMemoryMalloc(contLen);
  if (pReq == NULL) {
    code = terrno;
    return code;
  }

  code = tSerializeSCreateDropMQSNodeReq(pReq, contLen, pDropReq);
  if (code < 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }

  STransAction action = {
      .epSet = *pDroprEpSet,
      .pCont = pReq,
      .contLen = contLen,
      .msgType = TDMT_DND_DROP_MNODE,
      .acceptableCode = TSDB_CODE_MNODE_NOT_DEPLOYED,
      .groupId = -1,
  };

  if ((code = mndTransAppendRedoAction(pTrans, &action)) != 0) {
    taosMemoryFree(pReq);
    TAOS_RETURN(code);
  }
  TAOS_RETURN(code);
}
470

471
/*
 * Build the create-mnode request sent to pDnode and append it to pTrans.
 *
 * Every mnode currently in sdb is listed as a voter or learner according to
 * its role; pDnode itself is appended as one additional learner. The request
 * also carries pObj->lastIndex and the sdb encryption flag.
 *
 * Returns 0 on success or the error from mndBuildCreateMnodeRedoAction().
 */
static int32_t mndSetCreateMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb            *pSdb = pMnode->pSdb;
  SDCreateMnodeReq createReq = {0};
  SEpSet           createEpset = {0};
  int32_t          voterCnt = 0;
  int32_t          learnerCnt = 0;
  void            *pIter = NULL;

  for (;;) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    if (pMObj->role != TAOS_SYNC_ROLE_VOTER) {
      createReq.learnerReplicas[learnerCnt].id = pMObj->id;
      createReq.learnerReplicas[learnerCnt].port = pMObj->pDnode->port;
      memcpy(createReq.learnerReplicas[learnerCnt].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
      learnerCnt++;
    } else {
      createReq.replicas[voterCnt].id = pMObj->id;
      createReq.replicas[voterCnt].port = pMObj->pDnode->port;
      memcpy(createReq.replicas[voterCnt].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
      voterCnt++;
    }

    sdbRelease(pSdb, pMObj);
  }

  // The target dnode takes the next free learner slot.
  createReq.learnerReplicas[learnerCnt].id = pDnode->id;
  createReq.learnerReplicas[learnerCnt].port = pDnode->port;
  memcpy(createReq.learnerReplicas[learnerCnt].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);

  createReq.replica = voterCnt;
  createReq.learnerReplica = learnerCnt + 1;
  createReq.lastIndex = pObj->lastIndex;
  // Pass current sdb encryption status to new mnode
  createReq.encrypted = pSdb->encrypted ? 1 : 0;

  // The request is delivered to the target dnode only.
  createEpset.inUse = 0;
  createEpset.numOfEps = 1;
  createEpset.eps[0].port = pDnode->port;
  memcpy(createEpset.eps[0].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);

  TAOS_CHECK_RETURN(mndBuildCreateMnodeRedoAction(pTrans, &createReq, &createEpset));

  TAOS_RETURN(0);
}
518

519
/*
 * Restore variant of the create-mnode redo action for pDnode.
 *
 * Every mnode in sdb except the one whose id equals pDnode->id is listed as a
 * voter or learner according to its role; pDnode is then appended as a
 * learner. The request also carries pObj->lastIndex and the sdb encryption
 * flag.
 *
 * Returns 0 on success or the error from mndBuildCreateMnodeRedoAction().
 */
int32_t mndSetRestoreCreateMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb            *pSdb = pMnode->pSdb;
  SDCreateMnodeReq createReq = {0};
  SEpSet           createEpset = {0};
  void            *pIter = NULL;

  for (;;) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    // The mnode being restored is skipped here and added explicitly below.
    if (pMObj->id != pDnode->id) {
      if (pMObj->role != TAOS_SYNC_ROLE_VOTER) {
        createReq.learnerReplicas[createReq.learnerReplica].id = pMObj->id;
        createReq.learnerReplicas[createReq.learnerReplica].port = pMObj->pDnode->port;
        memcpy(createReq.learnerReplicas[createReq.learnerReplica].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
        createReq.learnerReplica++;
      } else {
        createReq.replicas[createReq.replica].id = pMObj->id;
        createReq.replicas[createReq.replica].port = pMObj->pDnode->port;
        memcpy(createReq.replicas[createReq.replica].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
        createReq.replica++;
      }
    }

    sdbRelease(pSdb, pMObj);
  }

  createReq.learnerReplicas[createReq.learnerReplica].id = pDnode->id;
  createReq.learnerReplicas[createReq.learnerReplica].port = pDnode->port;
  memcpy(createReq.learnerReplicas[createReq.learnerReplica].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);
  createReq.learnerReplica++;

  createReq.lastIndex = pObj->lastIndex;
  // Pass current sdb encryption status to restored mnode
  createReq.encrypted = pSdb->encrypted ? 1 : 0;

  // The request is delivered to the target dnode only.
  createEpset.inUse = 0;
  createEpset.numOfEps = 1;
  createEpset.eps[0].port = pDnode->port;
  memcpy(createEpset.eps[0].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);

  TAOS_CHECK_RETURN(mndBuildCreateMnodeRedoAction(pTrans, &createReq, &createEpset));

  TAOS_RETURN(0);
}
568

569
/*
 * Build the alter-mnode-type request sent to pDnode and append it to pTrans.
 *
 * Every mnode currently in sdb is listed as a voter or learner according to
 * its role; pDnode itself is appended to the voter list. The request also
 * carries pObj->lastIndex and the sdb encryption flag.
 *
 * Returns 0 on success or the error from mndBuildAlterMnodeTypeRedoAction().
 */
static int32_t mndSetAlterMnodeTypeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb               *pSdb = pMnode->pSdb;
  SDAlterMnodeTypeReq alterReq = {0};
  SEpSet              createEpset = {0};
  void               *pIter = NULL;

  for (;;) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    if (pMObj->role != TAOS_SYNC_ROLE_VOTER) {
      alterReq.learnerReplicas[alterReq.learnerReplica].id = pMObj->id;
      alterReq.learnerReplicas[alterReq.learnerReplica].port = pMObj->pDnode->port;
      memcpy(alterReq.learnerReplicas[alterReq.learnerReplica].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
      alterReq.learnerReplica++;
    } else {
      alterReq.replicas[alterReq.replica].id = pMObj->id;
      alterReq.replicas[alterReq.replica].port = pMObj->pDnode->port;
      memcpy(alterReq.replicas[alterReq.replica].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
      alterReq.replica++;
    }

    sdbRelease(pSdb, pMObj);
  }

  // The target dnode joins the voter list.
  alterReq.replicas[alterReq.replica].id = pDnode->id;
  alterReq.replicas[alterReq.replica].port = pDnode->port;
  memcpy(alterReq.replicas[alterReq.replica].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);
  alterReq.replica++;

  alterReq.lastIndex = pObj->lastIndex;
  // Pass current sdb encryption status to altered mnode
  alterReq.encrypted = pSdb->encrypted ? 1 : 0;

  // The request is delivered to the target dnode only.
  createEpset.inUse = 0;
  createEpset.numOfEps = 1;
  createEpset.eps[0].port = pDnode->port;
  memcpy(createEpset.eps[0].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);

  TAOS_CHECK_RETURN(mndBuildAlterMnodeTypeRedoAction(pTrans, &alterReq, &createEpset));

  TAOS_RETURN(0);
}
613

614
/*
 * Restore variant of the alter-mnode-type redo action for pDnode.
 *
 * Every mnode in sdb except the one whose id equals pDnode->id is listed as a
 * voter or learner according to its role; pDnode is then appended to the
 * voter list. The request also carries pObj->lastIndex and the sdb encryption
 * flag.
 *
 * Returns 0 on success or the error from mndBuildAlterMnodeTypeRedoAction().
 */
int32_t mndSetRestoreAlterMnodeTypeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj) {
  SSdb               *pSdb = pMnode->pSdb;
  SDAlterMnodeTypeReq alterReq = {0};
  SEpSet              createEpset = {0};
  void               *pIter = NULL;

  for (;;) {
    SMnodeObj *pMObj = NULL;
    pIter = sdbFetch(pSdb, SDB_MNODE, pIter, (void **)&pMObj);
    if (pIter == NULL) break;

    // The mnode being restored is skipped here and added explicitly below.
    if (pMObj->id != pDnode->id) {
      if (pMObj->role != TAOS_SYNC_ROLE_VOTER) {
        alterReq.learnerReplicas[alterReq.learnerReplica].id = pMObj->id;
        alterReq.learnerReplicas[alterReq.learnerReplica].port = pMObj->pDnode->port;
        memcpy(alterReq.learnerReplicas[alterReq.learnerReplica].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
        alterReq.learnerReplica++;
      } else {
        alterReq.replicas[alterReq.replica].id = pMObj->id;
        alterReq.replicas[alterReq.replica].port = pMObj->pDnode->port;
        memcpy(alterReq.replicas[alterReq.replica].fqdn, pMObj->pDnode->fqdn, TSDB_FQDN_LEN);
        alterReq.replica++;
      }
    }

    sdbRelease(pSdb, pMObj);
  }

  alterReq.replicas[alterReq.replica].id = pDnode->id;
  alterReq.replicas[alterReq.replica].port = pDnode->port;
  memcpy(alterReq.replicas[alterReq.replica].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);
  alterReq.replica++;

  alterReq.lastIndex = pObj->lastIndex;
  // Pass current sdb encryption status to restored and altered mnode
  alterReq.encrypted = pSdb->encrypted ? 1 : 0;

  // The request is delivered to the target dnode only.
  createEpset.inUse = 0;
  createEpset.numOfEps = 1;
  createEpset.eps[0].port = pDnode->port;
  memcpy(createEpset.eps[0].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);

  TAOS_CHECK_RETURN(mndBuildAlterMnodeTypeRedoAction(pTrans, &alterReq, &createEpset));

  TAOS_RETURN(0);
}
663

664
/*
 * Create and prepare the serial "create-mnode" transaction for pDnode.
 *
 * The transaction is assembled in two stages:
 *   1. a learner-role row (lastIndex = pMnode->applied) supplies the
 *      create-mnode redo action and the redo log;
 *   2. a voter-role row (lastIndex = pMnode->applied + 1) supplies the
 *      alter-mnode-type redo action and the commit log.
 *
 * The transaction object is dropped before returning on every path.
 * Returns 0 on success, otherwise the first failing step's error code.
 */
static int32_t mndCreateMnode(SMnode *pMnode, SRpcMsg *pReq, SDnodeObj *pDnode, SMCreateMnodeReq *pCreate) {
  int32_t code = -1;

  STrans *pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "create-mnode");
  if (pTrans == NULL) {
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto _OVER;
  }
  mndTransSetSerial(pTrans);
  mInfo("trans:%d, used to create mnode:%d", pTrans->id, pCreate->dnodeId);
  TAOS_CHECK_GOTO(mndTransCheckConflict(pMnode, pTrans), NULL, _OVER);

  // Stage 1: the new mnode first joins as a learner.
  int64_t   learnerTs = taosGetTimestampMs();
  SMnodeObj mnodeObj = {
      .id = pDnode->id,
      .createdTime = learnerTs,
      .updateTime = learnerTs,
      .role = TAOS_SYNC_ROLE_LEARNER,
      .lastIndex = pMnode->applied,
  };

  TAOS_CHECK_GOTO(mndSetCreateMnodeRedoActions(pMnode, pTrans, pDnode, &mnodeObj), NULL, _OVER);
  TAOS_CHECK_GOTO(mndSetCreateMnodeRedoLogs(pMnode, pTrans, &mnodeObj), NULL, _OVER);

  // Stage 2: the committed row records it as a voter.
  int64_t   voterTs = taosGetTimestampMs();
  SMnodeObj mnodeLeaderObj = {
      .id = pDnode->id,
      .createdTime = voterTs,
      .updateTime = voterTs,
      .role = TAOS_SYNC_ROLE_VOTER,
      .lastIndex = pMnode->applied + 1,
  };

  TAOS_CHECK_GOTO(mndSetAlterMnodeTypeRedoActions(pMnode, pTrans, pDnode, &mnodeLeaderObj), NULL, _OVER);
  TAOS_CHECK_GOTO(mndSetCreateMnodeCommitLogs(pMnode, pTrans, &mnodeLeaderObj), NULL, _OVER);
  TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);

  code = 0;

_OVER:
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
704

705
/*
 * Handler for TDMT_MND_CREATE_MNODE.
 *
 * Steps: deserialize the request, check the caller's privilege, then reject
 * the request when
 *   - an mnode with that id already exists,
 *   - the dnode does not exist,
 *   - sdb already holds 3 or more mnodes, or
 *   - the dnode is not online.
 * Otherwise the create transaction is started and, when audit level allows,
 * an audit record is written.
 *
 * Returns TSDB_CODE_ACTION_IN_PROGRESS when the transaction was started,
 * otherwise an error code. Acquired objects and the request are released on
 * every path.
 */
static int32_t mndProcessCreateMnodeReq(SRpcMsg *pReq) {
  SMnode          *pMnode = pReq->info.node;
  int32_t          code = -1;
  SMnodeObj       *pObj = NULL;
  SDnodeObj       *pDnode = NULL;
  SMCreateMnodeReq createReq = {0};
  int64_t          tss = taosGetTimestampMs();  // start time for the audit duration

  TAOS_CHECK_GOTO(tDeserializeSCreateDropMQSNodeReq(pReq->pCont, pReq->contLen, &createReq), NULL, _OVER);

  mInfo("mnode:%d, start to create", createReq.dnodeId);
  TAOS_CHECK_GOTO(mndCheckOperPrivilege(pMnode, RPC_MSG_USER(pReq), RPC_MSG_TOKEN(pReq), MND_OPER_CREATE_MNODE), NULL, _OVER);

  pObj = mndAcquireMnode(pMnode, createReq.dnodeId);
  if (pObj != NULL) {
    code = TSDB_CODE_MND_MNODE_ALREADY_EXIST;
    goto _OVER;
  } else if (terrno != TSDB_CODE_MND_MNODE_NOT_EXIST) {
    // Lookup failed for a reason other than "not found": report that reason
    // instead of leaving `code` at whatever the previous check stored in it.
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    goto _OVER;
  }

  pDnode = mndAcquireDnode(pMnode, createReq.dnodeId);
  if (pDnode == NULL) {
    code = TSDB_CODE_MND_DNODE_NOT_EXIST;
    goto _OVER;
  }

  if (sdbGetSize(pMnode->pSdb, SDB_MNODE) >= 3) {
    code = TSDB_CODE_MND_TOO_MANY_MNODES;
    goto _OVER;
  }

  if (!mndIsDnodeOnline(pDnode, taosGetTimestampMs())) {
    code = TSDB_CODE_DNODE_OFFLINE;
    goto _OVER;
  }

  code = mndCreateMnode(pMnode, pReq, pDnode, &createReq);
  if (code == 0) code = TSDB_CODE_ACTION_IN_PROGRESS;

  if (tsAuditLevel >= AUDIT_LEVEL_SYSTEM) {
    char    obj[40] = {0};
    int32_t bytes = snprintf(obj, sizeof(obj), "%d", createReq.dnodeId);
    // The unsigned cast also rejects a negative snprintf() result.
    if ((uint32_t)bytes < sizeof(obj)) {
      int64_t tse = taosGetTimestampMs();
      double  duration = (double)(tse - tss);
      duration = duration / 1000;  // milliseconds -> seconds
      auditRecord(pReq, pMnode->clusterId, "createMnode", "", obj, createReq.sql, createReq.sqlLen, duration, 0);
    } else {
      mError("mnode:%d, failed to audit create req since %s", createReq.dnodeId, tstrerror(TSDB_CODE_OUT_OF_RANGE));
    }
  }

_OVER:
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
    // Several branches above set `code` without touching terrno, so the
    // message must be derived from `code` to name the real reason.
    mError("mnode:%d, failed to create since %s", createReq.dnodeId, tstrerror(code));
  }

  mndReleaseMnode(pMnode, pObj);
  mndReleaseDnode(pMnode, pDnode);
  tFreeSMCreateQnodeReq(&createReq);

  TAOS_RETURN(code);
}
769

770
// Encode pObj and append it to pTrans as a group redo log (third argument -1),
// then mark the encoded raw as SDB_STATUS_DROPPING.
// Returns 0 on success. If encoding yields NULL, returns terrno when it is set,
// otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. Any failure from the append or
// status call is returned as-is.
static int32_t mndSetDropMnodeRedoLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  int32_t  code = 0;
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  if (pRaw == NULL) {
    // Prefer the error left in terrno; fall back to the generic NULL-return code.
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  TAOS_CHECK_RETURN(mndTransAppendGroupRedolog(pTrans, pRaw, -1));
  TAOS_CHECK_RETURN(sdbSetRawStatus(pRaw, SDB_STATUS_DROPPING));

  TAOS_RETURN(code);
}
782

783
// Encode pObj and append it to pTrans as a commit log, then mark the encoded
// raw as SDB_STATUS_DROPPED.
// Returns 0 on success. If encoding yields NULL, returns terrno when it is set,
// otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. Any failure from the append or
// status call is returned as-is.
static int32_t mndSetDropMnodeCommitLogs(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj) {
  int32_t  code = 0;
  SSdbRaw *pRaw = mndMnodeActionEncode(pObj);

  if (pRaw == NULL) {
    // Prefer the error left in terrno; fall back to the generic NULL-return code.
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
    TAOS_RETURN(code);
  }

  TAOS_CHECK_RETURN(mndTransAppendCommitlog(pTrans, pRaw));
  TAOS_CHECK_RETURN(sdbSetRawStatus(pRaw, SDB_STATUS_DROPPED));

  TAOS_RETURN(code);
}
795

796
// Add the redo steps for dropping the mnode pObj hosted on pDnode to pTrans.
//
// A drop request and a single-endpoint SEpSet are built from pDnode (id, port,
// fqdn). The order of the steps depends on how many mnodes are in the sdb:
//   - 2 mnodes: the redo log is appended first, then the drop action.
//               A forced drop is rejected with TSDB_CODE_MNODE_ONLY_TWO_MNODE.
//   - 3 mnodes: the drop action is appended first (skipped when force is set),
//               then the redo log.
//   - any other count: returns -1.
// Returns 0 on success, otherwise the first failing step's code.
static int32_t mndSetDropMnodeRedoActions(SMnode *pMnode, STrans *pTrans, SDnodeObj *pDnode, SMnodeObj *pObj,
                                          bool force) {
  int32_t        code = 0;
  SSdb          *pSdb = pMnode->pSdb;
  SDDropMnodeReq dropReq = {0};
  SEpSet         dropEpSet = {0};

  dropReq.dnodeId = pDnode->id;
  dropEpSet.numOfEps = 1;
  dropEpSet.eps[0].port = pDnode->port;
  memcpy(dropEpSet.eps[0].fqdn, pDnode->fqdn, TSDB_FQDN_LEN);

  int32_t totalMnodes = sdbGetSize(pSdb, SDB_MNODE);
  if (totalMnodes == 2) {
    if (force) {
      mError("can't force drop dnode, since a mnode on it and replica is 2");
      code = TSDB_CODE_MNODE_ONLY_TWO_MNODE;
      TAOS_RETURN(code);
    }
    mInfo("vgId:1, has %d mnodes, exec redo log first", totalMnodes);
    TAOS_CHECK_RETURN(mndSetDropMnodeRedoLogs(pMnode, pTrans, pObj));
    // force is known to be false here (the forced case returned above), so the
    // drop action is always queued in this branch.
    TAOS_CHECK_RETURN(mndBuildDropMnodeRedoAction(pTrans, &dropReq, &dropEpSet));
  } else if (totalMnodes == 3) {
    mInfo("vgId:1, has %d mnodes, exec redo action first", totalMnodes);
    if (!force) {
      TAOS_CHECK_RETURN(mndBuildDropMnodeRedoAction(pTrans, &dropReq, &dropEpSet));
    }
    TAOS_CHECK_RETURN(mndSetDropMnodeRedoLogs(pMnode, pTrans, pObj));
  } else {
    TAOS_RETURN(-1);
  }

  TAOS_RETURN(code);
}
833

834
// Fill pTrans with everything needed to drop the mnode pObj: the redo steps
// (via mndSetDropMnodeRedoActions, using the mnode's own dnode) followed by the
// commit log. pObj->lastIndex is first set to pMnode->applied.
// A NULL pObj is treated as nothing to do and returns 0.
// Returns 0 on success, otherwise the failing step's code.
int32_t mndSetDropMnodeInfoToTrans(SMnode *pMnode, STrans *pTrans, SMnodeObj *pObj, bool force) {
  if (pObj != NULL) {
    pObj->lastIndex = pMnode->applied;

    TAOS_CHECK_RETURN(mndSetDropMnodeRedoActions(pMnode, pTrans, pObj->pDnode, pObj, force));
    TAOS_CHECK_RETURN(mndSetDropMnodeCommitLogs(pMnode, pTrans, pObj));
  }

  return 0;
}
841

842
// Create, fill and prepare the "drop-mnode" transaction for pObj.
// The transaction is created with TRN_POLICY_RETRY / TRN_CONFLICT_GLOBAL, set
// to serial, checked for conflicts, filled through mndSetDropMnodeInfoToTrans
// (force = false) and then prepared. mndTransDrop is called on every path.
// Returns 0 on success. If the transaction cannot be created, returns terrno
// when set, otherwise TSDB_CODE_MND_RETURN_VALUE_NULL. Other failures return
// the failing step's code.
static int32_t mndDropMnode(SMnode *pMnode, SRpcMsg *pReq, SMnodeObj *pObj) {
  int32_t code = -1;
  STrans *pTrans = mndTransCreate(pMnode, TRN_POLICY_RETRY, TRN_CONFLICT_GLOBAL, pReq, "drop-mnode");

  if (pTrans != NULL) {
    mndTransSetSerial(pTrans);
    mInfo("trans:%d, used to drop mnode:%d", pTrans->id, pObj->id);

    TAOS_CHECK_GOTO(mndTransCheckConflict(pMnode, pTrans), NULL, _OVER);
    TAOS_CHECK_GOTO(mndSetDropMnodeInfoToTrans(pMnode, pTrans, pObj, false), NULL, _OVER);
    TAOS_CHECK_GOTO(mndTransPrepare(pMnode, pTrans), NULL, _OVER);

    code = 0;
  } else {
    // Prefer the error left in terrno; fall back to the generic NULL-return code.
    code = (terrno != 0) ? terrno : TSDB_CODE_MND_RETURN_VALUE_NULL;
  }

_OVER:
  mndTransDrop(pTrans);
  TAOS_RETURN(code);
}
865

866
// Handle a "drop mnode" request.
//
// Steps, in order: deserialize the request, check the MND_OPER_DROP_MNODE
// privilege, then reject the request when
//   - dnodeId <= 0                          -> TSDB_CODE_INVALID_MSG
//   - no mnode exists for that dnode id     -> terrno, or TSDB_CODE_MND_RETURN_VALUE_NULL
//   - the target is this mnode's own dnode  -> TSDB_CODE_MND_CANT_DROP_LEADER
//   - one mnode or fewer exist              -> TSDB_CODE_MND_TOO_FEW_MNODES
//   - the target's dnode is not online      -> TSDB_CODE_DNODE_OFFLINE
// Otherwise the drop transaction is started through mndDropMnode, and a success
// is reported to the caller as TSDB_CODE_ACTION_IN_PROGRESS.
// When tsAuditLevel >= AUDIT_LEVEL_SYSTEM an audit record with the elapsed time
// in seconds is written after mndDropMnode returns, whatever its result.
static int32_t mndProcessDropMnodeReq(SRpcMsg *pReq) {
  SMnode        *pMnode = pReq->info.node;
  int32_t        code = -1;
  SMnodeObj     *pObj = NULL;
  SMDropMnodeReq dropReq = {0};
  int64_t        tss = taosGetTimestampMs();

  TAOS_CHECK_GOTO(tDeserializeSCreateDropMQSNodeReq(pReq->pCont, pReq->contLen, &dropReq), NULL, _OVER);

  mInfo("mnode:%d, start to drop", dropReq.dnodeId);
  TAOS_CHECK_GOTO(mndCheckOperPrivilege(pMnode, RPC_MSG_USER(pReq), RPC_MSG_TOKEN(pReq), MND_OPER_DROP_MNODE), NULL, _OVER);

  if (dropReq.dnodeId <= 0) {
    code = TSDB_CODE_INVALID_MSG;
    goto _OVER;
  }

  pObj = mndAcquireMnode(pMnode, dropReq.dnodeId);
  if (pObj == NULL) {
    code = TSDB_CODE_MND_RETURN_VALUE_NULL;
    if (terrno != 0) code = terrno;
    goto _OVER;
  }

  if (pMnode->selfDnodeId == dropReq.dnodeId) {
    code = TSDB_CODE_MND_CANT_DROP_LEADER;
    goto _OVER;
  }

  if (sdbGetSize(pMnode->pSdb, SDB_MNODE) <= 1) {
    code = TSDB_CODE_MND_TOO_FEW_MNODES;
    goto _OVER;
  }

  if (!mndIsDnodeOnline(pObj->pDnode, taosGetTimestampMs())) {
    code = TSDB_CODE_DNODE_OFFLINE;
    goto _OVER;
  }

  code = mndDropMnode(pMnode, pReq, pObj);
  if (code == 0) code = TSDB_CODE_ACTION_IN_PROGRESS;

  if (tsAuditLevel >= AUDIT_LEVEL_SYSTEM) {
    char obj[40] = {0};
    (void)snprintf(obj, sizeof(obj), "%d", dropReq.dnodeId);

    int64_t tse = taosGetTimestampMs();
    double  duration = (double)(tse - tss);
    duration = duration / 1000;  // milliseconds -> seconds
    auditRecord(pReq, pMnode->clusterId, "dropMnode", "", obj, dropReq.sql, dropReq.sqlLen, duration, 0);
  }

_OVER:
  if (code != 0 && code != TSDB_CODE_ACTION_IN_PROGRESS) {
    // Report the reason from `code`: several rejection paths above assign only
    // `code` and never touch terrno, so terrstr() could print an unrelated error.
    mError("mnode:%d, failed to drop since %s", dropReq.dnodeId, tstrerror(code));
  }

  mndReleaseMnode(pMnode, pObj);
  tFreeSMCreateQnodeReq(&dropReq);
  TAOS_RETURN(code);
}
927

928
// Fill pBlock with up to `rows` mnode rows for a show/retrieve request.
//
// Iteration state is kept in pShow->pIter so the scan can resume on the next
// call. For each mnode the columns are written in this order:
//   id, dnode endpoint, role, status, created time, role time.
// Role starts as "offline"; for this mnode it is the leader string (with a
// trailing '*' while pMnode->restored is false). If the mnode's dnode is online
// the role is replaced by syncStr(pObj->syncState), and a non-local mnode that
// reports leader is shown with the error state string instead.
// Status is "ready", "creating" or "dropping" from the sdb row status, or
// "offline" when the dnode is not online.
//
// Returns the number of rows written by this call. pShow->numOfRows is only
// advanced when the loop finishes without a column-write failure.
static int32_t mndRetrieveMnodes(SRpcMsg *pReq, SShowObj *pShow, SSDataBlock *pBlock, int32_t rows) {
  SMnode    *pMnode = pReq->info.node;
  SSdb      *pSdb = pMnode->pSdb;
  int32_t    numOfRows = 0;
  int32_t    cols = 0;
  SMnodeObj *pObj = NULL;
  SMnodeObj *pSelfObj = NULL;
  ESdbStatus objStatus = 0;
  int64_t    curMs = taosGetTimestampMs();
  int        code = 0;

  pSelfObj = sdbAcquire(pSdb, SDB_MNODE, &pMnode->selfDnodeId);
  if (pSelfObj == NULL) {
    mError("mnode:%d, failed to acquire self %s", pMnode->selfDnodeId, terrstr());
    goto _out;
  }

  while (numOfRows < rows) {
    pShow->pIter = sdbFetchAll(pSdb, SDB_MNODE, pShow->pIter, (void **)&pObj, &objStatus, true);
    if (pShow->pIter == NULL) break;

    // Column: mnode id.
    cols = 0;
    SColumnInfoData *pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pObj->id, false);
    // Every column failure goes through _err so the in-flight fetch is always
    // cancelled before the row is released.
    if (code != 0) goto _err;

    // Column: endpoint of the dnode hosting this mnode.
    char b1[TSDB_EP_LEN + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(b1, pObj->pDnode->ep, TSDB_EP_LEN + VARSTR_HEADER_SIZE);

    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, b1, false);
    if (code != 0) goto _err;

    // Column: role.
    char role[20] = "offline";
    if (pObj->id == pMnode->selfDnodeId) {
      snprintf(role, sizeof(role), "%s%s", syncStr(TAOS_SYNC_STATE_LEADER), pMnode->restored ? "" : "*");
    }
    bool isDnodeOnline = mndIsDnodeOnline(pObj->pDnode, curMs);
    if (isDnodeOnline) {
      tstrncpy(role, syncStr(pObj->syncState), sizeof(role));
      if (pObj->syncState == TAOS_SYNC_STATE_LEADER && pObj->id != pMnode->selfDnodeId) {
        tstrncpy(role, syncStr(TAOS_SYNC_STATE_ERROR), sizeof(role));
        mError("mnode:%d, is leader too", pObj->id);
      }
    }
    // NOTE(review): the copy limit comes from the column schema, not from
    // sizeof(b2) — confirm the schema width never exceeds this buffer.
    char b2[12 + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(b2, role, pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)b2, false);
    if (code != 0) goto _err;

    // Column: status.
    const char *status = "ready";
    if (objStatus == SDB_STATUS_CREATING) status = "creating";
    if (objStatus == SDB_STATUS_DROPPING) status = "dropping";
    if (!isDnodeOnline) status = "offline";
    // NOTE(review): same schema-width assumption as for b2 above.
    char b3[9 + VARSTR_HEADER_SIZE] = {0};
    STR_WITH_MAXSIZE_TO_VARSTR(b3, status, pShow->pMeta->pSchemas[cols].bytes);
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)b3, false);
    if (code != 0) goto _err;

    // Column: created time.
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&pObj->createdTime, false);
    if (code != 0) goto _err;

    // Column: role time, reported as 0 while the dnode is offline.
    int64_t roleTimeMs = (isDnodeOnline) ? pObj->roleTimeMs : 0;
    pColInfo = taosArrayGet(pBlock->pDataBlock, cols++);
    code = colDataSetVal(pColInfo, numOfRows, (const char *)&roleTimeMs, false);
    if (code != 0) goto _err;

    numOfRows++;
    sdbRelease(pSdb, pObj);
  }

  pShow->numOfRows += numOfRows;

_out:
  sdbRelease(pSdb, pSelfObj);
  return numOfRows;

_err:
  mError("mnode:%d, failed to set col data val since %s", pObj->id, tstrerror(code));
  sdbCancelFetch(pSdb, pShow->pIter);
  sdbRelease(pSdb, pObj);
  sdbRelease(pSdb, pSelfObj);
  return numOfRows;
}
1025

1026
// Cancel an in-progress SDB_MNODE fetch identified by pIter.
static void mndCancelGetNextMnode(SMnode *pMnode, void *pIter) {
  sdbCancelFetchByType(pMnode->pSdb, pIter, SDB_MNODE);
}
×
1030

1031
// Handle an "alter mnode" request.
//
// The handler is currently compiled as a no-op that returns 0 (the `#if 1`
// branch). The `#else` branch keeps the earlier implementation, which rewrote
// the mnode file and reconfigured sync from the replica list in the request;
// it is not compiled.
static int32_t mndProcessAlterMnodeReq(SRpcMsg *pReq) {
#if 1
  return 0;
#else
  int32_t         code = 0;
  SMnode         *pMnode = pReq->info.node;
  SDAlterMnodeReq alterReq = {0};

  TAOS_CHECK_RETURN(tDeserializeSDCreateMnodeReq(pReq->pCont, pReq->contLen, &alterReq));

  SMnodeOpt option = {.deploy = true, .numOfReplicas = alterReq.replica, .selfIndex = -1};
  memcpy(option.replicas, alterReq.replicas, sizeof(alterReq.replicas));
  for (int32_t i = 0; i < option.numOfReplicas; ++i) {
    if (alterReq.replicas[i].id == pMnode->selfDnodeId) {
      option.selfIndex = i;
    }
  }

  if (option.selfIndex == -1) {
    // The format string has no conversion specifier, so no argument is passed.
    mInfo("alter mnode not processed since selfIndex is -1");
    return 0;
  }

  if ((code = mndWriteFile(pMnode->path, &option)) != 0) {
    mError("failed to write mnode file since %s", terrstr());
    TAOS_RETURN(code);
  }

  SSyncCfg cfg = {.replicaNum = alterReq.replica, .myIndex = -1};
  for (int32_t i = 0; i < alterReq.replica; ++i) {
    SNodeInfo *pNode = &cfg.nodeInfo[i];
    tstrncpy(pNode->nodeFqdn, alterReq.replicas[i].fqdn, sizeof(pNode->nodeFqdn));
    pNode->nodePort = alterReq.replicas[i].port;
    if (alterReq.replicas[i].id == pMnode->selfDnodeId) {
      cfg.myIndex = i;
    }
  }

  if (cfg.myIndex == -1) {
    mError("failed to alter mnode since myindex is -1");
    return -1;
  } else {
    mInfo("start to alter mnode sync, replica:%d myIndex:%d", cfg.replicaNum, cfg.myIndex);
    for (int32_t i = 0; i < alterReq.replica; ++i) {
      SNodeInfo *pNode = &cfg.nodeInfo[i];
      mInfo("index:%d, fqdn:%s port:%d", i, pNode->nodeFqdn, pNode->nodePort);
    }
  }

  code = syncReconfig(pMnode->syncMgmt.sync, &cfg);
  if (code != 0) {
    mError("failed to sync reconfig since %s", terrstr());
  } else {
    mInfo("alter mnode sync success");
  }

  TAOS_RETURN(code);
#endif
}
1090

1091
// Rebuild the sync configuration from the mnode rows in the sdb and, when this
// node is part of it, apply it with syncReconfig.
//
// Every SDB_MNODE row is visited:
//   - READY and CREATING rows become entries of cfg.nodeInfo (dnode id, cluster
//     id, port, role, fqdn, then refreshed through tmsgUpdateDnodeInfo). Rows
//     whose role is TAOS_SYNC_ROLE_VOTER also count toward cfg.replicaNum.
//   - READY, CREATING and DROPPING rows all contribute to cfg.lastIndex, which
//     ends up as the largest lastIndex seen.
// If this node's dnode is not among the entries (cfg.myIndex stays -1) nothing
// is reconfigured. Reconfiguration is also skipped unless
// pMnode->syncMgmt.sync > 0.
static void mndReloadSyncConfig(SMnode *pMnode) {
  SSdb      *pSdb = pMnode->pSdb;
  SMnodeObj *pObj = NULL;
  ESdbStatus objStatus = 0;
  void      *pIter = NULL;
  int32_t    updatingMnodes = 0;
  int32_t    readyMnodes = 0;
  int32_t    code = 0;
  SSyncCfg   cfg = {
        .myIndex = -1,
        .lastIndex = 0,
  };

  while (1) {
    pIter = sdbFetchAll(pSdb, SDB_MNODE, pIter, (void **)&pObj, &objStatus, false);
    if (pIter == NULL) break;
    if (objStatus == SDB_STATUS_CREATING || objStatus == SDB_STATUS_DROPPING) {
      mInfo("vgId:1, has updating mnode:%d, status:%s", pObj->id, sdbStatusName(objStatus));
      updatingMnodes++;
    }
    if (objStatus == SDB_STATUS_READY) {
      mInfo("vgId:1, has ready mnode:%d, status:%s", pObj->id, sdbStatusName(objStatus));
      readyMnodes++;
    }

    if (objStatus == SDB_STATUS_READY || objStatus == SDB_STATUS_CREATING) {
      SNodeInfo *pNode = &cfg.nodeInfo[cfg.totalReplicaNum];
      pNode->nodeId = pObj->pDnode->id;
      pNode->clusterId = mndGetClusterId(pMnode);
      pNode->nodePort = pObj->pDnode->port;
      pNode->nodeRole = pObj->role;
      tstrncpy(pNode->nodeFqdn, pObj->pDnode->fqdn, TSDB_FQDN_LEN);
      code = tmsgUpdateDnodeInfo(&pNode->nodeId, &pNode->clusterId, pNode->nodeFqdn, &pNode->nodePort);
      if (code != 0) {
        // Logged only; the entry is still added to the configuration.
        mError("mnode:%d, failed to update dnode info since %s", pObj->id, terrstr());
      }
      mInfo("vgId:1, ep:%s:%u dnode:%d", pNode->nodeFqdn, pNode->nodePort, pNode->nodeId);
      if (pObj->pDnode->id == pMnode->selfDnodeId) {
        cfg.myIndex = cfg.totalReplicaNum;
      }
      if (pNode->nodeRole == TAOS_SYNC_ROLE_VOTER) {
        cfg.replicaNum++;
      }
      cfg.totalReplicaNum++;
    }

    // A DROPPING mnode is not added to the node list, but its lastIndex still
    // counts toward the maximum, the same as READY and CREATING rows.
    if (objStatus == SDB_STATUS_READY || objStatus == SDB_STATUS_CREATING || objStatus == SDB_STATUS_DROPPING) {
      if (pObj->lastIndex > cfg.lastIndex) {
        cfg.lastIndex = pObj->lastIndex;
      }
    }

    mInfo("vgId:1, mnode:%d, role:%d, lastIndex:%" PRId64, pObj->id, pObj->role, pObj->lastIndex);

    sdbReleaseLock(pSdb, pObj, false);
  }

  // if (readyMnodes <= 0 || updatingMnodes <= 0) {
  //   mInfo("vgId:1, mnode sync not reconfig since readyMnodes:%d updatingMnodes:%d", readyMnodes, updatingMnodes);
  //   return;
  // }

  if (cfg.myIndex == -1) {
#if 1
    mInfo("vgId:1, mnode sync not reconfig since selfIndex is -1");
#else
    // cannot reconfig because the leader may fail to elect after reboot
    mInfo("vgId:1, mnode sync not reconfig since selfIndex is -1, do sync stop oper");
    syncStop(pMnode->syncMgmt.sync);
#endif
    return;
  }

  if (pMnode->syncMgmt.sync > 0) {
    mInfo("vgId:1, mnode sync reconfig, totalReplica:%d replica:%d myIndex:%d", cfg.totalReplicaNum, cfg.replicaNum,
          cfg.myIndex);

    for (int32_t i = 0; i < cfg.totalReplicaNum; ++i) {
      SNodeInfo *pNode = &cfg.nodeInfo[i];
      mInfo("vgId:1, index:%d, ep:%s:%u dnode:%d cluster:%" PRId64 " role:%d", i, pNode->nodeFqdn, pNode->nodePort,
            pNode->nodeId, pNode->clusterId, pNode->nodeRole);
    }

    // Reuse the function-level `code` instead of declaring a shadowing local.
    code = syncReconfig(pMnode->syncMgmt.sync, &cfg);
    if (code != 0) {
      mError("vgId:1, mnode sync reconfig failed since %s", terrstr());
    } else {
      mInfo("vgId:1, mnode sync reconfig success");
    }
  }
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc