• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #3548

04 Dec 2024 01:03PM UTC coverage: 59.846% (-0.8%) from 60.691%
#3548

push

travis-ci

web-flow
Merge pull request #29033 from taosdata/fix/calculate-vnode-memory-used

fix/calculate-vnode-memory-used

118484 of 254183 branches covered (46.61%)

Branch coverage included in aggregate %.

199691 of 277471 relevant lines covered (71.97%)

18794141.86 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

57.14
/source/dnode/mgmt/node_mgmt/src/dmEnv.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#define _DEFAULT_SOURCE
17
// clang-format off
18
#include "dmMgmt.h"
19
#include "audit.h"
20
#include "libs/function/tudf.h"
21
#include "tgrant.h"
22
#include "tcompare.h"
23
#include "tcs.h"
24
#include "tanalytics.h"
25
// clang-format on
26

27
/*
 * Copies the monitor port/fqdn/comp settings into the expanding function's
 * local `auditCfg` and calls auditInit() on it.
 *
 * The expanding function must declare locals named `auditCfg` and `code`.
 * If auditInit() yields a non-zero value, the macro returns that value from
 * the expanding function.
 */
#define DM_INIT_AUDIT()              \
  do {                               \
    auditCfg.port = tsMonitorPort;   \
    auditCfg.server = tsMonitorFqdn; \
    auditCfg.comp = tsMonitorComp;   \
    code = auditInit(&auditCfg);     \
    if (code != 0) {                 \
      return code;                   \
    }                                \
  } while (0)
36

37
/* File-scope dnode object, zero-initialized; handed out via dmInstance(). */
static SDnode globalDnode = {0};

/* Returns the address of the file-scope dnode object. */
SDnode *dmInstance() {
  SDnode *pInstance = &globalDnode;
  return pInstance;
}
6,822,919✔
40

41
/*
 * Guards against initializing the dnode environment twice.
 *
 * Performs a compare-exchange on pDnode->once (expected DND_ENV_INIT, new
 * value DND_ENV_READY). Returns 0 when the exchange reports DND_ENV_INIT;
 * otherwise logs an error and returns TSDB_CODE_REPEAT_INIT.
 */
static int32_t dmCheckRepeatInit(SDnode *pDnode) {
  if (atomic_val_compare_exchange_8(&pDnode->once, DND_ENV_INIT, DND_ENV_READY) == DND_ENV_INIT) {
    return 0;
  }

  dError("env is already initialized");
  return TSDB_CODE_REPEAT_INIT;
}
50

51
/*
 * Process-level setup: calls taosIgnSIGPIPE(), taosBlockSIGPIPE() and
 * taosResolveCRC(), in that order.
 *
 * A non-zero result from either SIGPIPE call is only logged; the function
 * always returns 0.
 */
static int32_t dmInitSystem() {
  const bool ignoreFailed = (taosIgnSIGPIPE() != 0);
  if (ignoreFailed) {
    dError("failed to ignore SIGPIPE");
  }

  const bool blockFailed = (taosBlockSIGPIPE() != 0);
  if (blockFailed) {
    dError("failed to block SIGPIPE");
  }

  taosResolveCRC();
  return 0;
}
63

64
static int32_t dmInitMonitor() {
2,118✔
65
  int32_t code = 0;
2,118✔
66
  SMonCfg monCfg = {0};
2,118✔
67

68
  monCfg.maxLogs = tsMonitorMaxLogs;
2,118✔
69
  monCfg.port = tsMonitorPort;
2,118✔
70
  monCfg.server = tsMonitorFqdn;
2,118✔
71
  monCfg.comp = tsMonitorComp;
2,118✔
72
  if ((code = monInit(&monCfg)) != 0) {
2,118!
73
    dError("failed to init monitor since %s", tstrerror(code));
×
74
  }
75
  return code;
2,118✔
76
}
77

78
static int32_t dmInitAudit() {
2,118✔
79
  SAuditCfg auditCfg = {0};
2,118✔
80
  int32_t   code = 0;
2,118✔
81

82
  DM_INIT_AUDIT();
2,118!
83

84
  return 0;
2,118✔
85
}
86

87
static bool dmDataSpaceAvailable() {
2,118✔
88
  SDnode *pDnode = dmInstance();
2,118✔
89
  if (pDnode->pTfs) {
2,118!
90
    return tfsDiskSpaceAvailable(pDnode->pTfs, 0);
2,118✔
91
  }
92
  if (!osDataSpaceAvailable()) {
×
93
    dError("data disk space unavailable, i.e. %s", tsDataDir);
×
94
    return false;
×
95
  }
96
  return true;
×
97
}
98

99
static int32_t dmCheckDiskSpace() {
2,118✔
100
  // availability
101
  int32_t code = 0;
2,118✔
102
  code = osUpdate();
2,118✔
103
  if (code != 0) {
2,118!
104
    code = 0;  // ignore the error, just log it
×
105
    dError("failed to update os info since %s", tstrerror(code));
×
106
  }
107
  if (!dmDataSpaceAvailable()) {
2,118!
108
    code = TSDB_CODE_NO_DISKSPACE;
×
109
    return code;
×
110
  }
111
  if (!osLogSpaceAvailable()) {
2,118!
112
    dError("log disk space unavailable, i.e. %s", tsLogDir);
×
113
    code = TSDB_CODE_NO_DISKSPACE;
×
114
    return code;
×
115
  }
116
  if (!osTempSpaceAvailable()) {
2,118!
117
    dError("temp disk space unavailable, i.e. %s", tsTempDir);
×
118
    code = TSDB_CODE_NO_DISKSPACE;
×
119
    return code;
×
120
  }
121
  return code;
2,118✔
122
}
123

124
int32_t dmDiskInit() {
2,118✔
125
  SDnode  *pDnode = dmInstance();
2,118✔
126
  SDiskCfg dCfg = {.level = 0, .primary = 1, .disable = 0};
2,118✔
127
  tstrncpy(dCfg.dir, tsDataDir, TSDB_FILENAME_LEN);
2,118✔
128
  SDiskCfg *pDisks = tsDiskCfg;
2,118✔
129
  int32_t   numOfDisks = tsDiskCfgNum;
2,118✔
130
  if (numOfDisks <= 0 || pDisks == NULL) {
2,118!
131
    pDisks = &dCfg;
×
132
    numOfDisks = 1;
×
133
  }
134

135
  int32_t code = tfsOpen(pDisks, numOfDisks, &pDnode->pTfs);
2,118✔
136
  if (code != 0) {
2,118!
137
    dError("failed to init tfs since %s", tstrerror(code));
×
138
    TAOS_RETURN(code);
×
139
  }
140
  return 0;
2,118✔
141
}
142

143
int32_t dmDiskClose() {
2,117✔
144
  SDnode *pDnode = dmInstance();
2,117✔
145
  tfsClose(pDnode->pTfs);
2,117✔
146
  pDnode->pTfs = NULL;
2,117✔
147
  return 0;
2,117✔
148
}
149

150
static bool dmCheckDataDirVersion() {
2,118✔
151
  char checkDataDirJsonFileName[PATH_MAX] = {0};
2,118✔
152
  snprintf(checkDataDirJsonFileName, PATH_MAX, "%s/dnode/dnodeCfg.json", tsDataDir);
2,118✔
153
  if (taosCheckExistFile(checkDataDirJsonFileName)) {
2,118!
154
    dError("The default data directory %s contains old data of tdengine 2.x, please clear it before running!",
×
155
           tsDataDir);
156
    return false;
×
157
  }
158
  return true;
2,118✔
159
}
160

161
static int32_t dmCheckDataDirVersionWrapper() {
×
162
  if (!dmCheckDataDirVersion()) {
×
163
    return TSDB_CODE_INVALID_DATA_FMT;
×
164
  }
165
  return 0;
×
166
}
167

168
int32_t dmInit() {
2,118✔
169
  dInfo("start to init dnode env");
2,118!
170
  int32_t code = 0;
2,118✔
171
  if ((code = dmDiskInit()) != 0) return code;
2,118!
172
  if (!dmCheckDataDirVersion()) {
2,118!
173
    code = TSDB_CODE_INVALID_DATA_FMT;
×
174
    return code;
×
175
  }
176
  if ((code = dmCheckDiskSpace()) != 0) return code;
2,118!
177
  if ((code = dmCheckRepeatInit(dmInstance())) != 0) return code;
2,118!
178
  if ((code = dmInitSystem()) != 0) return code;
2,118!
179
  if ((code = dmInitMonitor()) != 0) return code;
2,118!
180
  if ((code = dmInitAudit()) != 0) return code;
2,118!
181
  if ((code = dmInitDnode(dmInstance())) != 0) return code;
2,118✔
182
  if ((code = InitRegexCache() != 0)) return code;
2,117!
183
#if defined(USE_S3)
184
  if ((code = tcsInit()) != 0) return code;
2,117!
185
#endif
186

187
  dInfo("dnode env is initialized");
2,117!
188
  return 0;
2,117✔
189
}
190

191
/*
 * Guards against cleaning up the dnode environment twice.
 *
 * Performs a compare-exchange on pDnode->once (expected DND_ENV_READY, new
 * value DND_ENV_CLEANUP). Returns 0 when the exchange reports DND_ENV_READY;
 * otherwise logs an error and returns -1.
 */
static int32_t dmCheckRepeatCleanup(SDnode *pDnode) {
  if (atomic_val_compare_exchange_8(&pDnode->once, DND_ENV_READY, DND_ENV_CLEANUP) == DND_ENV_READY) {
    return 0;
  }

  dError("dnode env is already cleaned up");
  return -1;
}
198

199
void dmCleanup() {
2,117✔
200
  dDebug("start to cleanup dnode env");
2,117✔
201
  SDnode *pDnode = dmInstance();
2,117✔
202
  if (dmCheckRepeatCleanup(pDnode) != 0) return;
2,117!
203
  dmCleanupDnode(pDnode);
2,117✔
204
  monCleanup();
2,117✔
205
  auditCleanup();
2,117✔
206
  syncCleanUp();
2,117✔
207
  walCleanUp();
2,117✔
208
  if (udfcClose() != 0) {
2,117!
209
    dError("failed to close udfc");
×
210
  }
211
  udfStopUdfd();
2,117✔
212
  taosAnalyticsCleanup();
2,117✔
213
  taosStopCacheRefreshWorker();
2,117✔
214
  (void)dmDiskClose();
2,117✔
215
  DestroyRegexCache();
2,117✔
216

217
#if defined(USE_S3)
218
  tcsUninit();
2,117✔
219
#endif
220

221
  dInfo("dnode env is cleaned up");
2,117!
222

223
  taosCleanupCfg();
2,117✔
224
  taosCloseLog();
2,117✔
225
}
226

227
void dmStop() {
2,118✔
228
  SDnode *pDnode = dmInstance();
2,118✔
229
  pDnode->stop = true;
2,118✔
230
}
2,118✔
231

232
/* Runs the dnode instance via dmRunDnode() and returns its result. */
int32_t dmRun() {
  return dmRunDnode(dmInstance());
}
236

237
/*
 * Handles a create-node request for the management node of type `ntype`.
 *
 * If dmAcquireWrapper() returns a wrapper for `ntype`, the request is rejected
 * with the matching *_ALREADY_DEPLOYED code (TSDB_CODE_APP_ERROR for other
 * types). Otherwise the node directory is created, and under pDnode->mutex the
 * node's createFp is invoked, followed by dmOpenNode() and dmStartNode().
 *
 * @param ntype  node type to create
 * @param pMsg   request message, forwarded to the node's createFp
 * @return 0 on success, otherwise the error code of the failing step
 */
static int32_t dmProcessCreateNodeReq(EDndNodeType ntype, SRpcMsg *pMsg) {
  int32_t code = 0;
  SDnode *pDnode = dmInstance();

  SMgmtWrapper *pWrapper = dmAcquireWrapper(pDnode, ntype);
  if (pWrapper != NULL) {
    // A wrapper could be acquired, so the node already exists: reject.
    dmReleaseWrapper(pWrapper);
    switch (ntype) {
      case MNODE:
        code = TSDB_CODE_MNODE_ALREADY_DEPLOYED;
        break;
      case QNODE:
        code = TSDB_CODE_QNODE_ALREADY_DEPLOYED;
        break;
      case SNODE:
        code = TSDB_CODE_SNODE_ALREADY_DEPLOYED;
        break;
      default:
        code = TSDB_CODE_APP_ERROR;
    }
    dError("failed to create node since %s", tstrerror(code));
    return code;
  }

  dInfo("start to process create-node-request");

  pWrapper = &pDnode->wrappers[ntype];
  if (taosMkDir(pWrapper->path) != 0) {
    // Capture terrno right after the failing call, before any other call can
    // overwrite it.
    code = terrno;
    // NOTE(review): no wrapper reference was acquired on this path
    // (dmAcquireWrapper returned NULL above), so this release looks
    // unbalanced -- confirm against dmReleaseWrapper's contract.
    dmReleaseWrapper(pWrapper);
    dError("failed to create dir:%s since %s", pWrapper->path, tstrerror(code));
    return code;
  }

  (void)taosThreadMutexLock(&pDnode->mutex);
  SMgmtInputOpt input = dmBuildMgmtInputOpt(pWrapper);

  dInfo("node:%s, start to create", pWrapper->name);
  code = (*pWrapper->func.createFp)(&input, pMsg);
  if (code != 0) {
    dError("node:%s, failed to create since %s", pWrapper->name, tstrerror(code));
  } else {
    dInfo("node:%s, has been created", pWrapper->name);
    code = dmOpenNode(pWrapper);
    if (code == 0) {
      code = dmStartNode(pWrapper);
    }
    // Set once createFp succeeded, regardless of the open/start result.
    pWrapper->deployed = true;
    pWrapper->required = true;
  }

  (void)taosThreadMutexUnlock(&pDnode->mutex);
  return code;
}
291

292
/*
 * Handles an alter-node-type request for the management node of type `ntype`.
 *
 * Preconditions checked before anything is changed:
 *   - dmAcquireWrapper() must return a wrapper (else TSDB_CODE_INVALID_MSG);
 *   - if nodeRoleFp is set, the role must not be TAOS_SYNC_ROLE_VOTER
 *     (else TSDB_CODE_MNODE_ALREADY_IS_VOTER);
 *   - if isCatchUpFp is set, it must return 1
 *     (else TSDB_CODE_MNODE_NOT_CATCH_UP).
 *
 * Then, under pDnode->mutex, the node is stopped and closed, its directory is
 * (re)created, and it is created, opened and started again.
 *
 * @param ntype  node type to alter
 * @param pMsg   request message, forwarded to the node's createFp
 * @return 0 on success, otherwise the error code of the failing step
 */
static int32_t dmProcessAlterNodeTypeReq(EDndNodeType ntype, SRpcMsg *pMsg) {
  int32_t code = 0;
  SDnode *pDnode = dmInstance();

  SMgmtWrapper *pWrapper = dmAcquireWrapper(pDnode, ntype);
  if (pWrapper == NULL) {
    dError("fail to process alter node type since node not exist");
    return TSDB_CODE_INVALID_MSG;
  }
  // The acquire was only an existence check; the wrapper is accessed through
  // pDnode->wrappers[] from here on.
  dmReleaseWrapper(pWrapper);

  dInfo("node:%s, start to process alter-node-type-request", pWrapper->name);

  pWrapper = &pDnode->wrappers[ntype];

  if (pWrapper->func.nodeRoleFp != NULL) {
    ESyncRole role = (*pWrapper->func.nodeRoleFp)(pWrapper->pMgmt);
    dInfo("node:%s, checking node role:%d", pWrapper->name, role);
    if (role == TAOS_SYNC_ROLE_VOTER) {
      dError("node:%s, failed to alter node type since node already is role:%d", pWrapper->name, role);
      code = TSDB_CODE_MNODE_ALREADY_IS_VOTER;
      return code;
    }
  }

  if (pWrapper->func.isCatchUpFp != NULL) {
    dInfo("node:%s, checking node catch up", pWrapper->name);
    if ((*pWrapper->func.isCatchUpFp)(pWrapper->pMgmt) != 1) {
      code = TSDB_CODE_MNODE_NOT_CATCH_UP;
      return code;
    }
  }

  dInfo("node:%s, catched up leader, continue to process alter-node-type-request", pWrapper->name);

  (void)taosThreadMutexLock(&pDnode->mutex);

  dInfo("node:%s, stopping node", pWrapper->name);
  dmStopNode(pWrapper);
  dInfo("node:%s, closing node", pWrapper->name);
  dmCloseNode(pWrapper);

  pWrapper = &pDnode->wrappers[ntype];
  if (taosMkDir(pWrapper->path) != 0) {
    // Capture terrno right after the failing call, before the unlock below can
    // overwrite it.
    code = terrno;
    (void)taosThreadMutexUnlock(&pDnode->mutex);
    dError("failed to create dir:%s since %s", pWrapper->path, tstrerror(code));
    return code;
  }

  SMgmtInputOpt input = dmBuildMgmtInputOpt(pWrapper);

  dInfo("node:%s, start to create", pWrapper->name);
  code = (*pWrapper->func.createFp)(&input, pMsg);
  if (code != 0) {
    dError("node:%s, failed to create since %s", pWrapper->name, tstrerror(code));
  } else {
    dInfo("node:%s, has been created", pWrapper->name);
    code = dmOpenNode(pWrapper);
    if (code == 0) {
      code = dmStartNode(pWrapper);
    }
    // Set once createFp succeeded, regardless of the open/start result.
    pWrapper->deployed = true;
    pWrapper->required = true;
  }

  (void)taosThreadMutexUnlock(&pDnode->mutex);
  return code;
}
361

362
/*
 * Handles a drop-node request for the management node of type `ntype`.
 *
 * If no wrapper can be acquired, the matching *_NOT_DEPLOYED code
 * (TSDB_CODE_APP_ERROR for other types) is stored in terrno and returned.
 * Otherwise, under pDnode->mutex, the node's dropFp is invoked; on success the
 * wrapper is marked not required / not deployed, and after the wrapper
 * reference is released the node is stopped, closed and its directory removed.
 *
 * @param ntype  node type to drop
 * @param pMsg   request message, forwarded to the node's dropFp
 * @return 0 on success, otherwise the error code
 */
static int32_t dmProcessDropNodeReq(EDndNodeType ntype, SRpcMsg *pMsg) {
  int32_t code = 0;
  SDnode *pNode = dmInstance();

  SMgmtWrapper *pWrapper = dmAcquireWrapper(pNode, ntype);
  if (pWrapper == NULL) {
    if (ntype == MNODE) {
      code = TSDB_CODE_MNODE_NOT_DEPLOYED;
    } else if (ntype == QNODE) {
      code = TSDB_CODE_QNODE_NOT_DEPLOYED;
    } else if (ntype == SNODE) {
      code = TSDB_CODE_SNODE_NOT_DEPLOYED;
    } else {
      code = TSDB_CODE_APP_ERROR;
    }

    dError("failed to drop node since %s", tstrerror(code));
    terrno = code;
    return terrno;
  }

  (void)taosThreadMutexLock(&pNode->mutex);
  SMgmtInputOpt input = dmBuildMgmtInputOpt(pWrapper);

  dInfo("node:%s, start to drop", pWrapper->name);
  code = (*pWrapper->func.dropFp)(&input, pMsg);
  if (code == 0) {
    dInfo("node:%s, has been dropped", pWrapper->name);
    pWrapper->required = false;
    pWrapper->deployed = false;
  } else {
    dError("node:%s, failed to drop since %s", pWrapper->name, tstrerror(code));
  }

  // Give back the reference taken by dmAcquireWrapper() before stopping the node.
  dmReleaseWrapper(pWrapper);

  if (code == 0) {
    dmStopNode(pWrapper);
    dmCloseNode(pWrapper);
    taosRemoveDir(pWrapper->path);
  }

  (void)taosThreadMutexUnlock(&pNode->mutex);
  return code;
}
409

410
/*
 * Builds the SMgmtInputOpt handed to a management node's callbacks.
 *
 * Copies path/name from the wrapper, the tfs handle and data pointer from the
 * owning dnode, wires the dnode-level callback functions, and fills msgCb from
 * dmGetMsgcb(). Fields not assigned here are zero.
 *
 * @param pWrapper  wrapper of the management node the options are built for
 * @return the populated options, by value
 */
SMgmtInputOpt dmBuildMgmtInputOpt(SMgmtWrapper *pWrapper) {
  SDnode       *pOwner = pWrapper->pDnode;
  SMgmtInputOpt opt = {0};

  // Identity and storage.
  opt.path = pWrapper->path;
  opt.name = pWrapper->name;
  opt.pTfs = pOwner->pTfs;
  opt.pData = &pOwner->data;

  // Node lifecycle request handlers.
  opt.processCreateNodeFp = dmProcessCreateNodeReq;
  opt.processAlterNodeTypeFp = dmProcessAlterNodeTypeReq;
  opt.processDropNodeFp = dmProcessDropNodeReq;

  // Monitor and audit hooks.
  opt.sendMonitorReportFp = dmSendMonitorReport;
  opt.monitorCleanExpiredSamplesFp = dmMonitorCleanExpiredSamples;
  opt.sendAuditRecordFp = auditSendRecordsInBatch;

  // Load getters.
  opt.getVnodeLoadsFp = dmGetVnodeLoads;
  opt.getVnodeLoadsLiteFp = dmGetVnodeLoadsLite;
  opt.getMnodeLoadsFp = dmGetMnodeLoads;
  opt.getQnodeLoadsFp = dmGetQnodeLoads;

  opt.stopDnodeFp = dmStop;

  opt.msgCb = dmGetMsgcb(pOwner);
  return opt;
}
432

433
void dmReportStartup(const char *pName, const char *pDesc) {
113,774✔
434
  SStartupInfo *pStartup = &(dmInstance()->startup);
113,774✔
435
  tstrncpy(pStartup->name, pName, TSDB_STEP_NAME_LEN);
113,774✔
436
  tstrncpy(pStartup->desc, pDesc, TSDB_STEP_DESC_LEN);
113,774✔
437
  dDebug("step:%s, %s", pStartup->name, pStartup->desc);
113,774✔
438
}
113,773✔
439

440
/* Returns the clusterId stored in the file-scope dnode's data. */
int64_t dmGetClusterId() {
  return globalDnode.data.clusterId;
}
×
441

442
bool dmReadyForTest() { return dmInstance()->data.dnodeVer > 0; }
×
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc