• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #3664

20 Mar 2025 09:19AM UTC coverage: 35.63%. First build
#3664

push

travis-ci

web-flow
Merge 8112ba125 into 9b7434d0a

72910 of 278358 branches covered (26.19%)

Branch coverage included in aggregate %.

195 of 257 new or added lines in 17 files covered. (75.88%)

125571 of 278710 relevant lines covered (45.05%)

1012723.65 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

52.12
/source/dnode/mgmt/node_mgmt/src/dmEnv.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
// clang-format off
18
#include "dmMgmt.h"
19
#include "audit.h"
20
#include "libs/function/tudf.h"
21
#include "tgrant.h"
22
#include "tcompare.h"
23
#include "tcs.h"
24
#include "tanalytics.h"
25
// clang-format on
26

27
/*
 * Fill `auditCfg` from the global monitor settings and call auditInit().
 * Must be expanded inside a function that has `auditCfg` and `code` in scope;
 * when auditInit() reports a non-zero code, that code is returned from the
 * enclosing function.
 */
#define DM_INIT_AUDIT()              \
  do {                               \
    auditCfg.port = tsMonitorPort;   \
    auditCfg.server = tsMonitorFqdn; \
    auditCfg.comp = tsMonitorComp;   \
    code = auditInit(&auditCfg);     \
    if (code != 0) {                 \
      return code;                   \
    }                                \
  } while (0)
36

37
/* The single dnode object for this translation unit, zero-initialized. */
static SDnode globalDnode = {0};

/* Return a pointer to the file-scope dnode object. */
SDnode *dmInstance() {
  return &globalDnode;
}
6,256✔
40

41
/*
 * Compare-and-swap pDnode->once from DND_ENV_INIT to DND_ENV_READY.
 *
 * Returns 0 when the exchange reports DND_ENV_INIT, otherwise logs an error
 * and returns TSDB_CODE_REPEAT_INIT.
 */
static int32_t dmCheckRepeatInit(SDnode *pDnode) {
  if (atomic_val_compare_exchange_8(&pDnode->once, DND_ENV_INIT, DND_ENV_READY) == DND_ENV_INIT) {
    return 0;
  }

  dError("env is already initialized");
  return TSDB_CODE_REPEAT_INIT;
}
50

51
/*
 * Process-level setup: ignore and block SIGPIPE, then call taosResolveCRC().
 *
 * Failures of the two SIGPIPE calls are only logged; the function always
 * returns 0.
 */
static int32_t dmInitSystem() {
  if (0 != taosIgnSIGPIPE()) {
    dError("failed to ignore SIGPIPE");
  }

  if (0 != taosBlockSIGPIPE()) {
    dError("failed to block SIGPIPE");
  }

  taosResolveCRC();
  return 0;
}
63

64
static int32_t dmInitMonitor() {
73✔
65
  int32_t code = 0;
73✔
66
  SMonCfg monCfg = {0};
73✔
67

68
  monCfg.maxLogs = tsMonitorMaxLogs;
73✔
69
  monCfg.port = tsMonitorPort;
73✔
70
  monCfg.server = tsMonitorFqdn;
73✔
71
  monCfg.comp = tsMonitorComp;
73✔
72
  if ((code = monInit(&monCfg)) != 0) {
73!
73
    dError("failed to init monitor since %s", tstrerror(code));
×
74
  }
75
  return code;
73✔
76
}
77

78
static int32_t dmInitAudit() {
73✔
79
  SAuditCfg auditCfg = {0};
73✔
80
  int32_t   code = 0;
73✔
81

82
  DM_INIT_AUDIT();
73!
83

84
  return 0;
73✔
85
}
86

87
static bool dmDataSpaceAvailable() {
73✔
88
  SDnode *pDnode = dmInstance();
73✔
89
  if (pDnode->pTfs) {
73!
90
    return tfsDiskSpaceAvailable(pDnode->pTfs, 0);
73✔
91
  }
92
  if (!osDataSpaceAvailable()) {
×
93
    dError("data disk space unavailable, i.e. %s", tsDataDir);
×
94
    return false;
×
95
  }
96
  return true;
×
97
}
98

99
static int32_t dmCheckDiskSpace() {
73✔
100
  // availability
101
  int32_t code = 0;
73✔
102
  code = osUpdate();
73✔
103
  if (code != 0) {
73!
104
    dError("failed to update os info since %s", tstrerror(code));
×
105
    code = 0;  // ignore the error, just log it
×
106
  }
107
  if (!dmDataSpaceAvailable()) {
73!
108
    code = TSDB_CODE_NO_DISKSPACE;
×
109
    return code;
×
110
  }
111
  if (!osLogSpaceAvailable()) {
73!
112
    dError("log disk space unavailable, i.e. %s", tsLogDir);
×
113
    code = TSDB_CODE_NO_DISKSPACE;
×
114
    return code;
×
115
  }
116
  if (!osTempSpaceAvailable()) {
73!
117
    dError("temp disk space unavailable, i.e. %s", tsTempDir);
×
118
    code = TSDB_CODE_NO_DISKSPACE;
×
119
    return code;
×
120
  }
121
  return code;
73✔
122
}
123

124
int32_t dmDiskInit() {
73✔
125
  SDnode  *pDnode = dmInstance();
73✔
126
  SDiskCfg dCfg = {.level = 0, .primary = 1, .disable = 0};
73✔
127
  tstrncpy(dCfg.dir, tsDataDir, TSDB_FILENAME_LEN);
73✔
128
  SDiskCfg *pDisks = tsDiskCfg;
73✔
129
  int32_t   numOfDisks = tsDiskCfgNum;
73✔
130
  if (numOfDisks <= 0 || pDisks == NULL) {
73!
131
    pDisks = &dCfg;
8✔
132
    numOfDisks = 1;
8✔
133
  }
134

135
  int32_t code = tfsOpen(pDisks, numOfDisks, &pDnode->pTfs);
73✔
136
  if (code != 0) {
73!
137
    dError("failed to init tfs since %s", tstrerror(code));
×
138
    TAOS_RETURN(code);
×
139
  }
140
  return 0;
73✔
141
}
142

143
int32_t dmDiskClose() {
21✔
144
  SDnode *pDnode = dmInstance();
21✔
145
  tfsClose(pDnode->pTfs);
21✔
146
  pDnode->pTfs = NULL;
21✔
147
  return 0;
21✔
148
}
149

150
static bool dmCheckDataDirVersion() {
73✔
151
  char checkDataDirJsonFileName[PATH_MAX] = {0};
73✔
152
  snprintf(checkDataDirJsonFileName, PATH_MAX, "%s/dnode/dnodeCfg.json", tsDataDir);
73✔
153
  if (taosCheckExistFile(checkDataDirJsonFileName)) {
73!
154
    dError("The default data directory %s contains old data of tdengine 2.x, please clear it before running!",
×
155
           tsDataDir);
156
    return false;
×
157
  }
158
  return true;
73✔
159
}
160

161
static int32_t dmCheckDataDirVersionWrapper() {
×
162
  if (!dmCheckDataDirVersion()) {
×
163
    return TSDB_CODE_INVALID_DATA_FMT;
×
164
  }
165
  return 0;
×
166
}
167

168
int32_t dmInit() {
73✔
169
  dInfo("start to init dnode env");
73!
170
  int32_t code = 0;
73✔
171
  if ((code = dmDiskInit()) != 0) return code;
73!
172
  if (!dmCheckDataDirVersion()) {
73!
173
    code = TSDB_CODE_INVALID_DATA_FMT;
×
174
    return code;
×
175
  }
176
  if ((code = dmCheckDiskSpace()) != 0) return code;
73!
177
  if ((code = dmCheckRepeatInit(dmInstance())) != 0) return code;
73!
178
  if ((code = dmInitSystem()) != 0) return code;
73!
179
  if ((code = dmInitMonitor()) != 0) return code;
73!
180
  if ((code = dmInitAudit()) != 0) return code;
73!
181
  if ((code = dmInitDnode(dmInstance())) != 0) return code;
73✔
182
  if ((code = InitRegexCache() != 0)) return code;
72!
183
#if defined(USE_S3)
184
  if ((code = tcsInit()) != 0) return code;
72!
185
#endif
186

187
  dInfo("dnode env is initialized");
72!
188
  return 0;
72✔
189
}
190

191
/*
 * Compare-and-swap pDnode->once from DND_ENV_READY to DND_ENV_CLEANUP.
 *
 * Returns 0 when the exchange reports DND_ENV_READY, otherwise logs an error
 * and returns -1.
 */
static int32_t dmCheckRepeatCleanup(SDnode *pDnode) {
  if (atomic_val_compare_exchange_8(&pDnode->once, DND_ENV_READY, DND_ENV_CLEANUP) == DND_ENV_READY) {
    return 0;
  }

  dError("dnode env is already cleaned up");
  return -1;
}
198

199
void dmCleanup() {
29✔
200
  dDebug("start to cleanup dnode env");
29✔
201
  SDnode *pDnode = dmInstance();
29✔
202
  if (dmCheckRepeatCleanup(pDnode) != 0) return;
29✔
203
  dmCleanupDnode(pDnode);
21✔
204
  monCleanup();
21✔
205
  auditCleanup();
21✔
206
  syncCleanUp();
21✔
207
  walCleanUp();
21✔
208
  if (udfcClose() != 0) {
21!
209
    dError("failed to close udfc");
×
210
  }
211
  udfStopUdfd();
21✔
212
  taosAnalyticsCleanup();
21✔
213
  taosStopCacheRefreshWorker();
21✔
214
  (void)dmDiskClose();
21✔
215
  DestroyRegexCache();
21✔
216

217
#if defined(USE_S3)
218
  tcsUninit();
21✔
219
#endif
220

221
  dInfo("dnode env is cleaned up");
21!
222

223
  taosMemPoolClose(gMemPoolHandle);
21✔
224
  taosCleanupCfg();
21✔
225
  taosCloseLog();
21✔
226
}
227

228
void dmStop() {
21✔
229
  SDnode *pDnode = dmInstance();
21✔
230
  pDnode->stop = true;
21✔
231
}
21✔
232

233
/* Run the dnode instance and return the code produced by dmRunDnode(). */
int32_t dmRun() {
  return dmRunDnode(dmInstance());
}
237

238
/*
 * Handle a create-node request for the given node type.
 *
 * If a wrapper for `ntype` can already be acquired, the node counts as
 * deployed and the matching *_ALREADY_DEPLOYED code is returned
 * (TSDB_CODE_APP_ERROR for node types not listed in the switch).
 * Otherwise the node directory is created and, under pDnode->mutex, the
 * wrapper's createFp is invoked, followed by dmOpenNode() and dmStartNode().
 *
 * @param ntype node type, used as index into pDnode->wrappers.
 * @param pMsg  request message passed through to createFp.
 * @return 0 on success, otherwise the code of the first failing step.
 */
static int32_t dmProcessCreateNodeReq(EDndNodeType ntype, SRpcMsg *pMsg) {
  int32_t code = 0;
  SDnode *pDnode = dmInstance();

  SMgmtWrapper *pWrapper = dmAcquireWrapper(pDnode, ntype);
  if (pWrapper != NULL) {
    // Only needed to learn that the node exists; drop the reference again.
    dmReleaseWrapper(pWrapper);
    switch (ntype) {
      case MNODE:
        code = TSDB_CODE_MNODE_ALREADY_DEPLOYED;
        break;
      case QNODE:
        code = TSDB_CODE_QNODE_ALREADY_DEPLOYED;
        break;
      case SNODE:
        code = TSDB_CODE_SNODE_ALREADY_DEPLOYED;
        break;
      case XNODE:
        code = TSDB_CODE_XNODE_ALREADY_DEPLOYED;
        break;
      default:
        code = TSDB_CODE_APP_ERROR;
    }
    dError("failed to create node since %s", tstrerror(code));
    return code;
  }

  dInfo("start to process create-node-request");

  pWrapper = &pDnode->wrappers[ntype];
  if (taosMkDir(pWrapper->path) != 0) {
    // Read terrno right after the failing call, before anything else can
    // overwrite it. No dmReleaseWrapper() here: dmAcquireWrapper() returned
    // NULL above, so this path holds no reference to give back.
    code = terrno;
    dError("failed to create dir:%s since %s", pWrapper->path, tstrerror(code));
    return code;
  }

  (void)taosThreadMutexLock(&pDnode->mutex);
  SMgmtInputOpt input = dmBuildMgmtInputOpt(pWrapper);

  dInfo("node:%s, start to create", pWrapper->name);
  code = (*pWrapper->func.createFp)(&input, pMsg);
  if (code != 0) {
    dError("node:%s, failed to create since %s", pWrapper->name, tstrerror(code));
  } else {
    dInfo("node:%s, has been created", pWrapper->name);
    code = dmOpenNode(pWrapper);
    if (code == 0) {
      code = dmStartNode(pWrapper);
    }
    // Set once createFp succeeded, regardless of the open/start result.
    pWrapper->deployed = true;
    pWrapper->required = true;
  }

  (void)taosThreadMutexUnlock(&pDnode->mutex);
  return code;
}
×
295

×
296
/*
 * Handle an alter-node-type request for the given node type.
 *
 * The node must already exist (its wrapper can be acquired), must not
 * already report TAOS_SYNC_ROLE_VOTER through nodeRoleFp, and must report
 * catch-up (isCatchUpFp returns 1). When those checks pass, the node is
 * stopped and closed and then re-created via createFp, opened and started,
 * all under pDnode->mutex.
 *
 * @param ntype node type, used as index into pDnode->wrappers.
 * @param pMsg  request message passed through to createFp.
 * @return 0 on success; TSDB_CODE_INVALID_MSG if the node does not exist,
 *         TSDB_CODE_MNODE_ALREADY_IS_VOTER, TSDB_CODE_MNODE_NOT_CATCH_UP,
 *         or the code of the failing mkdir/create/open/start step.
 */
static int32_t dmProcessAlterNodeTypeReq(EDndNodeType ntype, SRpcMsg *pMsg) {
  int32_t code = 0;
  SDnode *pDnode = dmInstance();

  SMgmtWrapper *pWrapper = dmAcquireWrapper(pDnode, ntype);
  if (pWrapper == NULL) {
    dError("fail to process alter node type since node not exist");
    return TSDB_CODE_INVALID_MSG;
  }
  dmReleaseWrapper(pWrapper);

  dInfo("node:%s, start to process alter-node-type-request", pWrapper->name);

  pWrapper = &pDnode->wrappers[ntype];

  if (pWrapper->func.nodeRoleFp != NULL) {
    ESyncRole role = (*pWrapper->func.nodeRoleFp)(pWrapper->pMgmt);
    dInfo("node:%s, checking node role:%d", pWrapper->name, role);
    if (role == TAOS_SYNC_ROLE_VOTER) {
      dError("node:%s, failed to alter node type since node already is role:%d", pWrapper->name, role);
      code = TSDB_CODE_MNODE_ALREADY_IS_VOTER;
      return code;
    }
  }

  if (pWrapper->func.isCatchUpFp != NULL) {
    dInfo("node:%s, checking node catch up", pWrapper->name);
    if ((*pWrapper->func.isCatchUpFp)(pWrapper->pMgmt) != 1) {
      code = TSDB_CODE_MNODE_NOT_CATCH_UP;
      return code;
    }
  }

  dInfo("node:%s, catched up leader, continue to process alter-node-type-request", pWrapper->name);

  (void)taosThreadMutexLock(&pDnode->mutex);

  dInfo("node:%s, stopping node", pWrapper->name);
  dmStopNode(pWrapper);
  dInfo("node:%s, closing node", pWrapper->name);
  dmCloseNode(pWrapper);

  pWrapper = &pDnode->wrappers[ntype];
  if (taosMkDir(pWrapper->path) != 0) {
    // Read terrno right after the failing call; unlocking the mutex first
    // could overwrite it.
    code = terrno;
    (void)taosThreadMutexUnlock(&pDnode->mutex);
    dError("failed to create dir:%s since %s", pWrapper->path, tstrerror(code));
    return code;
  }

  SMgmtInputOpt input = dmBuildMgmtInputOpt(pWrapper);

  dInfo("node:%s, start to create", pWrapper->name);
  code = (*pWrapper->func.createFp)(&input, pMsg);
  if (code != 0) {
    dError("node:%s, failed to create since %s", pWrapper->name, tstrerror(code));
  } else {
    dInfo("node:%s, has been created", pWrapper->name);
    code = dmOpenNode(pWrapper);
    if (code == 0) {
      code = dmStartNode(pWrapper);
    }
    // Set once createFp succeeded, regardless of the open/start result.
    pWrapper->deployed = true;
    pWrapper->required = true;
  }

  (void)taosThreadMutexUnlock(&pDnode->mutex);
  return code;
}
3✔
365

3✔
366
/*
 * Handle a drop-node request for the given node type.
 *
 * When no wrapper can be acquired for `ntype`, the matching *_NOT_DEPLOYED
 * code (TSDB_CODE_APP_ERROR for unlisted types) is stored in terrno and
 * returned. Otherwise dropFp is invoked under pDnode->mutex; on success the
 * wrapper flags are cleared, the node is stopped and closed, and its
 * directory is removed.
 *
 * @param ntype node type to drop.
 * @param pMsg  request message passed through to dropFp.
 * @return 0 on success, otherwise the not-deployed code or the dropFp code.
 */
static int32_t dmProcessDropNodeReq(EDndNodeType ntype, SRpcMsg *pMsg) {
  SDnode       *pDnode = dmInstance();
  SMgmtWrapper *pWrapper = dmAcquireWrapper(pDnode, ntype);
  int32_t       code = 0;

  if (pWrapper == NULL) {
    if (ntype == MNODE) {
      code = TSDB_CODE_MNODE_NOT_DEPLOYED;
    } else if (ntype == QNODE) {
      code = TSDB_CODE_QNODE_NOT_DEPLOYED;
    } else if (ntype == SNODE) {
      code = TSDB_CODE_SNODE_NOT_DEPLOYED;
    } else if (ntype == XNODE) {
      code = TSDB_CODE_XNODE_NOT_DEPLOYED;
    } else {
      code = TSDB_CODE_APP_ERROR;
    }

    dError("failed to drop node since %s", tstrerror(code));
    terrno = code;
    return code;
  }

  (void)taosThreadMutexLock(&pDnode->mutex);
  SMgmtInputOpt input = dmBuildMgmtInputOpt(pWrapper);

  dInfo("node:%s, start to drop", pWrapper->name);
  code = (*pWrapper->func.dropFp)(&input, pMsg);

  const bool dropped = (code == 0);
  if (dropped) {
    dInfo("node:%s, has been dropped", pWrapper->name);
    pWrapper->required = false;
    pWrapper->deployed = false;
  } else {
    dError("node:%s, failed to drop since %s", pWrapper->name, tstrerror(code));
  }

  // Give back the reference taken by dmAcquireWrapper() before stopping
  // and closing the node.
  dmReleaseWrapper(pWrapper);

  if (dropped) {
    dmStopNode(pWrapper);
    dmCloseNode(pWrapper);
    taosRemoveDir(pWrapper->path);
  }

  (void)taosThreadMutexUnlock(&pDnode->mutex);
  return code;
}
484✔
416

484✔
417
/*
 * Build the input options handed to a management node's function table.
 *
 * Path and name come from the wrapper, pTfs/pData/msgCb from the wrapper's
 * dnode, and the callback slots are filled with the dm* handlers of this
 * module (plus auditSendRecordsInBatch).
 *
 * @param pWrapper wrapper to build the options for.
 * @return the populated option struct, by value.
 */
SMgmtInputOpt dmBuildMgmtInputOpt(SMgmtWrapper *pWrapper) {
  SDnode *pOwner = pWrapper->pDnode;

  SMgmtInputOpt opt = {
      .path = pWrapper->path,
      .name = pWrapper->name,
      .pTfs = pOwner->pTfs,
      .pData = &pOwner->data,
      .processCreateNodeFp = dmProcessCreateNodeReq,
      .processAlterNodeTypeFp = dmProcessAlterNodeTypeReq,
      .processDropNodeFp = dmProcessDropNodeReq,
      .sendMonitorReportFp = dmSendMonitorReport,
      .monitorCleanExpiredSamplesFp = dmMonitorCleanExpiredSamples,
      .sendAuditRecordFp = auditSendRecordsInBatch,
      .getVnodeLoadsFp = dmGetVnodeLoads,
      .getVnodeLoadsLiteFp = dmGetVnodeLoadsLite,
      .getMnodeLoadsFp = dmGetMnodeLoads,
      .getQnodeLoadsFp = dmGetQnodeLoads,
      .stopDnodeFp = dmStop,
      .msgCb = dmGetMsgcb(pOwner),
  };

  return opt;
}
1,175✔
439

1,175✔
440
void dmReportStartup(const char *pName, const char *pDesc) {
441
  SStartupInfo *pStartup = &(dmInstance()->startup);
×
442
  tstrncpy(pStartup->name, pName, TSDB_STEP_NAME_LEN);
443
  tstrncpy(pStartup->desc, pDesc, TSDB_STEP_DESC_LEN);
34✔
444
  dDebug("step:%s, %s", pStartup->name, pStartup->desc);
445
}
446

447
/* Return the clusterId stored in the dnode instance's data. */
int64_t dmGetClusterId() {
  return globalDnode.data.clusterId;
}
448

449
bool dmReadyForTest() { return dmInstance()->data.dnodeVer > 0; }
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc