• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #4732

12 Sep 2025 02:34AM UTC coverage: 59.006% (+0.2%) from 58.768%
#4732

push

travis-ci

web-flow
docs: optimize taosd config parameters doc better (#32964)

136080 of 292959 branches covered (46.45%)

Branch coverage included in aggregate %.

204691 of 284559 relevant lines covered (71.93%)

25330922.01 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

78.51
/source/dnode/vnode/src/tsdb/tsdbMemTable.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#include "tsdb.h"
17
#include "util/tsimplehash.h"
18

19
// Initial number of hash buckets given to a new memtable (see tsdbMemTableCreate).
#define MEM_MIN_HASH 1024
20
// Size of the on-stack `pos[]` arrays used by the skip-list search/insert callers in this file.
#define SL_MAX_LEVEL 5
21

22
// sizeof(SMemSkipListNode) + sizeof(SMemSkipListNode *) * (l) * 2
23
// NOTE(review): `(l) << 4` adds 16 bytes per level, which equals the formula above only when a
// pointer is 8 bytes wide - confirm for any other target.
#define SL_NODE_SIZE(l)               (sizeof(SMemSkipListNode) + ((l) << 4))
24
// Forward link of node `n` at level `l`.
#define SL_NODE_FORWARD(n, l)         ((n)->forwards[l])
25
// Backward link of node `n` at level `l`; stored in the same forwards[] array, after the
// node's `level` forward links.
#define SL_NODE_BACKWARD(n, l)        ((n)->forwards[(n)->level + (l)])
26
// Atomic load/store wrappers around the link slots above.
#define SL_GET_NODE_FORWARD(n, l)     ((SMemSkipListNode *)atomic_load_ptr(&SL_NODE_FORWARD(n, l)))
27
#define SL_GET_NODE_BACKWARD(n, l)    ((SMemSkipListNode *)atomic_load_ptr(&SL_NODE_BACKWARD(n, l)))
28
#define SL_SET_NODE_FORWARD(n, l, p)  atomic_store_ptr(&SL_NODE_FORWARD(n, l), p)
29
#define SL_SET_NODE_BACKWARD(n, l, p) atomic_store_ptr(&SL_NODE_BACKWARD(n, l), p)
30

31
// Flag bits accepted by tbDataMovePosTo():
//   SL_MOVE_BACKWARD - search from the tail towards the head instead of head towards tail
//   SL_MOVE_FROM_POS - continue from the positions already stored in `pos[]`
#define SL_MOVE_BACKWARD 0x1
32
#define SL_MOVE_FROM_POS 0x2
33

34
// Forward declarations of file-local helpers defined further down.
static void    tbDataMovePosTo(STbData *pTbData, SMemSkipListNode **pos, STsdbRowKey *pKey, int32_t flags);
35
static int32_t tsdbGetOrCreateTbData(SMemTable *pMemTable, tb_uid_t suid, tb_uid_t uid, STbData **ppTbData);
36
static int32_t tsdbInsertRowDataToTable(SMemTable *pMemTable, STbData *pTbData, int64_t version,
37
                                        SSubmitTbData *pSubmitTbData, int32_t *affectedRows);
38
static int32_t tsdbInsertColDataToTable(SMemTable *pMemTable, STbData *pTbData, int64_t version,
39
                                        SSubmitTbData *pSubmitTbData, int32_t *affectedRows);
40

41
static int32_t tTbDataCmprFn(const SRBTreeNode *n1, const SRBTreeNode *n2) {
3,274,038✔
42
  STbData *tbData1 = TCONTAINER_OF(n1, STbData, rbtn);
3,274,038✔
43
  STbData *tbData2 = TCONTAINER_OF(n2, STbData, rbtn);
3,274,038✔
44
  if (tbData1->suid < tbData2->suid) return -1;
3,274,038✔
45
  if (tbData1->suid > tbData2->suid) return 1;
3,064,219✔
46
  if (tbData1->uid < tbData2->uid) return -1;
3,019,345✔
47
  if (tbData1->uid > tbData2->uid) return 1;
2,417,241!
48
  return 0;
×
49
}
50

51
// Allocate and initialise an empty memtable for `pTsdb`.
//
// On success stores the new memtable in *ppMemTable and returns 0. The memtable starts with
// nRef == 1, MEM_MIN_HASH buckets, and a reference on the vnode's in-use buffer pool.
// On allocation failure stores NULL in *ppMemTable and returns terrno.
int32_t tsdbMemTableCreate(STsdb *pTsdb, SMemTable **ppMemTable) {
  int32_t    code;
  SMemTable *pNew = (SMemTable *)taosMemoryCalloc(1, sizeof(*pNew));

  if (pNew == NULL) {
    code = terrno;
    *ppMemTable = NULL;
    return code;
  }

  taosInitRWLatch(&pNew->latch);
  pNew->pTsdb = pTsdb;
  pNew->pPool = pTsdb->pVnode->inUse;
  pNew->nRef = 1;

  // Empty ranges: min > max until the first insert/delete narrows them.
  pNew->minVer = VERSION_MAX;
  pNew->maxVer = VERSION_MIN;
  pNew->minKey = TSKEY_MAX;
  pNew->maxKey = TSKEY_MIN;

  pNew->nRow = 0;
  pNew->nDel = 0;
  pNew->nTbData = 0;

  pNew->nBucket = MEM_MIN_HASH;
  pNew->aBucket = (STbData **)taosMemoryCalloc(pNew->nBucket, sizeof(STbData *));
  if (pNew->aBucket == NULL) {
    code = terrno;  // capture before releasing the half-built object
    taosMemoryFree(pNew);
    *ppMemTable = NULL;
    return code;
  }

  vnodeBufPoolRef(pNew->pPool);
  tRBTreeCreate(pNew->tbDataTree, tTbDataCmprFn);

  *ppMemTable = pNew;
  return 0;
}
88

89
// Release a memtable: drop its buffer-pool reference, then free the bucket array and the
// memtable object itself. A NULL memtable is ignored.
void tsdbMemTableDestroy(SMemTable *pMemTable, bool proactive) {
  if (pMemTable == NULL) {
    return;
  }

  vnodeBufPoolUnRef(pMemTable->pPool, proactive);
  taosMemoryFree(pMemTable->aBucket);
  taosMemoryFree(pMemTable);
}
96

97
// Walk the hash chain selected by `uid` and return the entry whose uid matches, or NULL when
// there is none. `suid` is not consulted. No locking is done here.
static FORCE_INLINE STbData *tsdbGetTbDataFromMemTableImpl(SMemTable *pMemTable, tb_uid_t suid, tb_uid_t uid) {
  STbData *pCur;

  for (pCur = pMemTable->aBucket[TABS(uid) % pMemTable->nBucket]; pCur != NULL; pCur = pCur->next) {
    if (pCur->uid == uid) {
      return pCur;
    }
  }

  return NULL;
}
107

108
// Look up the table data for `uid` while holding the memtable latch in read mode.
// Returns the matching STbData or NULL when the table has no data in this memtable.
STbData *tsdbGetTbDataFromMemTable(SMemTable *pMemTable, tb_uid_t suid, tb_uid_t uid) {
  taosRLockLatch(&pMemTable->latch);
  STbData *pFound = tsdbGetTbDataFromMemTableImpl(pMemTable, suid, uid);
  taosRUnLockLatch(&pMemTable->latch);

  return pFound;
}
117

118
// Insert one submitted table batch into the current memtable of `pTsdb`.
//
// The rows go through the column-format or row-format path depending on
// SUBMIT_REQ_COLUMN_DATA_FORMAT in pSubmitTbData->flags. On success the memtable's
// [minVer, maxVer] range is widened to include `version` and 0 is returned.
// When the TSDB_BYPASS_RB_TSDB_WRITE_MEM bypass flag is set nothing is inserted and the
// function returns 0 (terrno is set to 0). On failure terrno is set to the error code,
// which is also returned.
int32_t tsdbInsertTableData(STsdb *pTsdb, int64_t version, SSubmitTbData *pSubmitTbData, int32_t *affectedRows) {
  SMemTable *pMem = pTsdb->mem;
  STbData   *pTable = NULL;
  tb_uid_t   tbSuid = pSubmitTbData->suid;
  tb_uid_t   tbUid = pSubmitTbData->uid;
  int32_t    code = 0;

  if (tsBypassFlag & TSDB_BYPASS_RB_TSDB_WRITE_MEM) {
    goto _err;
  }

  // locate (or lazily create) the per-table container
  code = tsdbGetOrCreateTbData(pMem, tbSuid, tbUid, &pTable);
  if (code != 0) {
    goto _err;
  }

  // dispatch on payload format
  if (pSubmitTbData->flags & SUBMIT_REQ_COLUMN_DATA_FORMAT) {
    code = tsdbInsertColDataToTable(pMem, pTable, version, pSubmitTbData, affectedRows);
  } else {
    code = tsdbInsertRowDataToTable(pMem, pTable, version, pSubmitTbData, affectedRows);
  }
  if (code != 0) {
    goto _err;
  }

  // widen the version range covered by this memtable
  pMem->minVer = TMIN(pMem->minVer, version);
  pMem->maxVer = TMAX(pMem->maxVer, version);
  return code;

_err:
  terrno = code;
  return code;
}
153

154
// Record a delete of the key range [sKey, eKey] at `version` for table (suid, uid).
//
// The table must be known to the vnode's meta store and its super-table id must equal `suid`.
// A delete record is allocated from the vnode's in-use buffer pool and appended to the table's
// delete list under the table's write latch. The memtable's delete counter and version range
// are updated, and the cache is asked to drop the same range (a cache failure is only logged).
//
// Returns 0 on success, TSDB_CODE_TDB_TABLE_NOT_EXIST when the meta lookup fails,
// TSDB_CODE_INVALID_MSG on a suid mismatch, or the error from table-data creation / allocation.
int32_t tsdbDeleteTableData(STsdb *pTsdb, int64_t version, tb_uid_t suid, tb_uid_t uid, TSKEY sKey, TSKEY eKey) {
  SMemTable *pMem = pTsdb->mem;
  SVBufPool *pBufPool = pTsdb->pVnode->inUse;
  STbData   *pTable = NULL;
  SDelData  *pDel = NULL;
  SMetaInfo  metaInfo;
  int32_t    code = 0;

  // the table has to exist and belong to the given super table
  code = metaGetInfo(pTsdb->pVnode->pMeta, uid, &metaInfo, NULL);
  if (code != 0) {
    code = TSDB_CODE_TDB_TABLE_NOT_EXIST;
    goto _err;
  }
  if (metaInfo.suid != suid) {
    code = TSDB_CODE_INVALID_MSG;
    goto _err;
  }

  code = tsdbGetOrCreateTbData(pMem, suid, uid, &pTable);
  if (code != 0) {
    goto _err;
  }

  // build the delete record
  pDel = (SDelData *)vnodeBufPoolMalloc(pBufPool, sizeof(*pDel));
  if (pDel == NULL) {
    code = terrno;
    goto _err;
  }
  pDel->version = version;
  pDel->sKey = sKey;
  pDel->eKey = eKey;
  pDel->pNext = NULL;

  // append it to the table's singly linked delete list
  taosWLockLatch(&pTable->lock);
  if (pTable->pHead != NULL) {
    pTable->pTail->pNext = pDel;
  } else {
    pTable->pHead = pDel;
  }
  pTable->pTail = pDel;
  taosWUnLockLatch(&pTable->lock);

  pMem->nDel++;
  pMem->minVer = TMIN(pMem->minVer, version);
  pMem->maxVer = TMAX(pMem->maxVer, version);

  if (tsdbCacheDel(pTsdb, suid, uid, sKey, eKey) != 0) {
    tsdbError("vgId:%d, failed to delete cache data from table suid:%" PRId64 " uid:%" PRId64 " skey:%" PRId64
              " eKey:%" PRId64 " at version %" PRId64,
              TD_VID(pTsdb->pVnode), suid, uid, sKey, eKey, version);
  }

  tsdbTrace("vgId:%d, delete data from table suid:%" PRId64 " uid:%" PRId64 " skey:%" PRId64 " eKey:%" PRId64
            " at version %" PRId64,
            TD_VID(pTsdb->pVnode), suid, uid, sKey, eKey, version);
  return code;

_err:
  tsdbError("vgId:%d, failed to delete data from table suid:%" PRId64 " uid:%" PRId64 " skey:%" PRId64 " eKey:%" PRId64
            " at version %" PRId64 " since %s",
            TD_VID(pTsdb->pVnode), suid, uid, sKey, eKey, version, tstrerror(code));
  return code;
}
217

218
// Heap-allocate an iterator over `pTbData` and position it via tsdbTbDataIterOpen().
// *ppIter receives the iterator, or NULL when allocation fails (terrno is then returned).
int32_t tsdbTbDataIterCreate(STbData *pTbData, STsdbRowKey *pFrom, int8_t backward, STbDataIter **ppIter) {
  STbDataIter *pNewIter = (STbDataIter *)taosMemoryCalloc(1, sizeof(STbDataIter));

  *ppIter = pNewIter;
  if (pNewIter == NULL) {
    return terrno;
  }

  tsdbTbDataIterOpen(pTbData, pFrom, backward, pNewIter);
  return 0;
}
232

233
// Free an iterator obtained from tsdbTbDataIterCreate(). Accepts NULL. Always returns NULL.
void *tsdbTbDataIterDestroy(STbDataIter *pIter) {
  if (pIter == NULL) {
    return NULL;
  }

  taosMemoryFree(pIter);
  return NULL;
}
239

240
// Initialise a caller-provided iterator over the skip list of `pTbData`.
//
// With pFrom == NULL the iterator starts at the node next to the head sentinel (forward) or
// next to the tail sentinel (backward). Otherwise tbDataMovePosTo() locates the position for
// *pFrom and the iterator starts at the level-0 neighbour of that position in the iteration
// direction. pIter->pRow is reset to NULL.
void tsdbTbDataIterOpen(STbData *pTbData, STsdbRowKey *pFrom, int8_t backward, STbDataIter *pIter) {
  SMemSkipListNode *pos[SL_MAX_LEVEL];

  pIter->pTbData = pTbData;
  pIter->backward = backward;
  pIter->pRow = NULL;

  if (pFrom == NULL) {
    // no start key: begin at one end of the list
    if (backward) {
      pIter->pNode = SL_GET_NODE_BACKWARD(pTbData->sl.pTail, 0);
    } else {
      pIter->pNode = SL_GET_NODE_FORWARD(pTbData->sl.pHead, 0);
    }
    return;
  }

  // start key given: search for it first
  if (backward) {
    tbDataMovePosTo(pTbData, pos, pFrom, SL_MOVE_BACKWARD);
    pIter->pNode = SL_GET_NODE_BACKWARD(pos[0], 0);
  } else {
    tbDataMovePosTo(pTbData, pos, pFrom, 0);
    pIter->pNode = SL_GET_NODE_FORWARD(pos[0], 0);
  }
}
268

269
// Advance the iterator one node in its direction and clear the cached row.
// Returns false when the iterator already sits on, or has just reached, the terminating
// sentinel (head when iterating backward, tail when iterating forward); true otherwise.
bool tsdbTbDataIterNext(STbDataIter *pIter) {
  SMemSkipListNode *pEnd;

  pIter->pRow = NULL;

  if (pIter->backward) {
    pEnd = pIter->pTbData->sl.pHead;
    if (pIter->pNode == pEnd) {
      return false;
    }
    pIter->pNode = SL_GET_NODE_BACKWARD(pIter->pNode, 0);
  } else {
    pEnd = pIter->pTbData->sl.pTail;
    if (pIter->pNode == pEnd) {
      return false;
    }
    pIter->pNode = SL_GET_NODE_FORWARD(pIter->pNode, 0);
  }

  return pIter->pNode != pEnd;
}
293

294
// Count the nodes between the head and tail sentinels by following level-0 forward links.
int64_t tsdbCountTbDataRows(STbData *pTbData) {
  SMemSkipListNode *pTailNode = pTbData->sl.pTail;
  SMemSkipListNode *pCur = pTbData->sl.pHead;
  int64_t           nCounted = 0;

  while (pCur != NULL) {
    pCur = SL_GET_NODE_FORWARD(pCur, 0);
    if (pCur == pTailNode) {
      break;
    }
    nCounted++;
  }

  return nCounted;
}
309

310
// Add to *rowsNum the row count of every table in the memtable whose uid is a key of
// `pTableMap`. The whole scan runs under the memtable latch held in read mode.
void tsdbMemTableCountRows(SMemTable *pMemTable, SSHashObj *pTableMap, int64_t *rowsNum) {
  taosRLockLatch(&pMemTable->latch);

  for (int32_t iBucket = 0; iBucket < pMemTable->nBucket; ++iBucket) {
    for (STbData *pEntry = pMemTable->aBucket[iBucket]; pEntry != NULL; pEntry = pEntry->next) {
      void *pHit = tSimpleHashGet(pTableMap, &pEntry->uid, sizeof(pEntry->uid));
      if (pHit != NULL) {
        *rowsNum += tsdbCountTbDataRows(pEntry);
      }
    }
  }

  taosRUnLockLatch(&pMemTable->latch);
}
327

328
// Callback signature expected by tsdbMemTableSaveToCache().
typedef int32_t (*__tsdb_cache_update)(SMemTable *imem, int64_t suid, int64_t uid);

// Invoke `func` (cast to __tsdb_cache_update) once for every table held in the memtable,
// passing the memtable and the table's suid/uid. Stops at, and returns, the first non-zero
// code reported by the callback; returns 0 when every call succeeds.
int32_t tsdbMemTableSaveToCache(SMemTable *pMemTable, void *func) {
  __tsdb_cache_update updateFn = (__tsdb_cache_update)func;
  int32_t             code = 0;

  for (int32_t iBucket = 0; iBucket < pMemTable->nBucket; ++iBucket) {
    for (STbData *pEntry = pMemTable->aBucket[iBucket]; pEntry != NULL; pEntry = pEntry->next) {
      code = updateFn(pMemTable, pEntry->suid, pEntry->uid);
      if (code) {
        TAOS_RETURN(code);
      }
    }
  }

  return code;
}
348

349
// Double the number of hash buckets and redistribute every STbData into the new array.
// Returns 0 on success, or terrno when the new array cannot be allocated (the old table is
// then left untouched).
static int32_t tsdbMemTableRehash(SMemTable *pMemTable) {
  int32_t   nGrown = pMemTable->nBucket * 2;
  STbData **aGrown = (STbData **)taosMemoryCalloc(nGrown, sizeof(STbData *));

  if (aGrown == NULL) {
    return terrno;
  }

  for (int32_t iOld = 0; iOld < pMemTable->nBucket; iOld++) {
    STbData *pEntry = pMemTable->aBucket[iOld];

    while (pEntry != NULL) {
      STbData  *pFollowing = pEntry->next;  // remember before relinking
      STbData **ppSlot = &aGrown[TABS(pEntry->uid) % nGrown];

      // push onto the front of the destination chain
      pEntry->next = *ppSlot;
      *ppSlot = pEntry;

      pEntry = pFollowing;
    }
  }

  taosMemoryFree(pMemTable->aBucket);
  pMemTable->nBucket = nGrown;
  pMemTable->aBucket = aGrown;

  return 0;
}
380

381
// Return the per-table container (STbData) for `uid` in `pMemTable`, creating and registering
// an empty one when the table has no data in this memtable yet.
//
// The lookup is done without taking the memtable latch; registration of a new entry (rehash,
// tree insert, bucket link) is done under the latch in write mode.
//
// A new STbData is allocated from the vnode's in-use buffer pool in a single chunk that also
// holds the skip list's head and tail sentinel nodes directly behind the struct. Both
// sentinels have `maxLevel` levels (taken from the vnode's tsdb config) and initially point at
// each other.
//
// Parameters:
//   pMemTable - memtable to search / extend
//   suid, uid - super-table id and table id stored in a newly created entry
//   ppTbData  - out: the found or created entry, NULL on failure
//
// Returns 0 on success; terrno on allocation failure; the rehash error when growing the bucket
// array fails; TSDB_CODE_INTERNAL_ERROR when the red-black tree rejects the new entry. On any
// failure the hash table and the tree are left without the new entry.
static int32_t tsdbGetOrCreateTbData(SMemTable *pMemTable, tb_uid_t suid, tb_uid_t uid, STbData **ppTbData) {
  int32_t code = 0;

  // get
  STbData *pTbData = tsdbGetTbDataFromMemTableImpl(pMemTable, suid, uid);
  if (pTbData) goto _exit;

  // create
  SVBufPool *pPool = pMemTable->pTsdb->pVnode->inUse;
  int8_t     maxLevel = pMemTable->pTsdb->pVnode->config.tsdbCfg.slLevel;

  // one chunk: STbData | head sentinel | tail sentinel
  pTbData = vnodeBufPoolMallocAligned(pPool, sizeof(*pTbData) + SL_NODE_SIZE(maxLevel) * 2);
  if (pTbData == NULL) {
    code = terrno;
    goto _exit;
  }
  pTbData->suid = suid;
  pTbData->uid = uid;
  pTbData->minKey = TSKEY_MAX;
  pTbData->maxKey = TSKEY_MIN;
  pTbData->pHead = NULL;
  pTbData->pTail = NULL;
  pTbData->sl.seed = taosRand();
  pTbData->sl.size = 0;
  pTbData->sl.maxLevel = maxLevel;
  pTbData->sl.level = 0;
  pTbData->sl.pHead = (SMemSkipListNode *)&pTbData[1];
  pTbData->sl.pTail = (SMemSkipListNode *)POINTER_SHIFT(pTbData->sl.pHead, SL_NODE_SIZE(maxLevel));
  pTbData->sl.pHead->level = maxLevel;
  pTbData->sl.pTail->level = maxLevel;
  for (int8_t iLevel = 0; iLevel < maxLevel; iLevel++) {
    // empty list: head <-> tail on every level, nothing beyond the sentinels
    SL_NODE_FORWARD(pTbData->sl.pHead, iLevel) = pTbData->sl.pTail;
    SL_NODE_BACKWARD(pTbData->sl.pTail, iLevel) = pTbData->sl.pHead;

    SL_NODE_BACKWARD(pTbData->sl.pHead, iLevel) = NULL;
    SL_NODE_FORWARD(pTbData->sl.pTail, iLevel) = NULL;
  }
  taosInitRWLatch(&pTbData->lock);

  taosWLockLatch(&pMemTable->latch);

  if (pMemTable->nTbData >= pMemTable->nBucket) {
    code = tsdbMemTableRehash(pMemTable);
    if (code) {
      taosWUnLockLatch(&pMemTable->latch);
      goto _exit;
    }
  }

  // Insert into the ordered tree first: if the tree rejects the entry, nothing has been linked
  // into the hash table yet, so the two indexes cannot disagree about which tables exist.
  if (tRBTreePut(pMemTable->tbDataTree, pTbData->rbtn) == NULL) {
    taosWUnLockLatch(&pMemTable->latch);
    code = TSDB_CODE_INTERNAL_ERROR;
    goto _exit;
  }

  int32_t idx = TABS(uid) % pMemTable->nBucket;
  pTbData->next = pMemTable->aBucket[idx];
  pMemTable->aBucket[idx] = pTbData;
  pMemTable->nTbData++;

  taosWUnLockLatch(&pMemTable->latch);

_exit:
  if (code) {
    *ppTbData = NULL;
  } else {
    *ppTbData = pTbData;
  }
  return code;
}
451

452
// Skip-list search: fill pos[0 .. maxLevel-1] with, per level, the node at which the walk
// stopped for `pKey`.
//
// flags:
//   SL_MOVE_BACKWARD - walk from the tail via backward links, stepping over nodes whose key
//                      compares greater than *pKey; otherwise walk from the head via forward
//                      links, stepping over nodes whose key compares less than *pKey.
//   SL_MOVE_FROM_POS - start from pos[level-1] as left by a previous call instead of from the
//                      sentinel, and leave the entries at and above the list's current level
//                      untouched.
//
// Without SL_MOVE_FROM_POS the entries for levels at or above the list's current level are set
// to the starting sentinel.
static void tbDataMovePosTo(STbData *pTbData, SMemSkipListNode **pos, STsdbRowKey *pKey, int32_t flags) {
  const int32_t     goBackward = flags & SL_MOVE_BACKWARD;
  const int32_t     resume = flags & SL_MOVE_FROM_POS;
  SMemSkipListNode *pCur;
  STsdbRowKey       nodeKey;

  if (goBackward) {
    SMemSkipListNode *pStop = pTbData->sl.pHead;

    pCur = pTbData->sl.pTail;

    if (!resume) {
      // levels not yet in use: position is the tail sentinel
      for (int8_t lvl = pTbData->sl.level; lvl < pTbData->sl.maxLevel; lvl++) {
        pos[lvl] = pCur;
      }
    }

    if (pTbData->sl.level == 0) {
      return;
    }
    if (resume) {
      pCur = pos[pTbData->sl.level - 1];
    }

    for (int8_t lvl = pTbData->sl.level - 1; lvl >= 0; lvl--) {
      for (;;) {
        SMemSkipListNode *pCand = SL_GET_NODE_BACKWARD(pCur, lvl);
        if (pCand == pStop) {
          break;
        }

        tsdbRowGetKey(&pCand->row, &nodeKey);
        if (tsdbRowKeyCmpr(&nodeKey, pKey) <= 0) {
          break;
        }

        pCur = pCand;
      }

      pos[lvl] = pCur;
    }
  } else {
    SMemSkipListNode *pStop = pTbData->sl.pTail;

    pCur = pTbData->sl.pHead;

    if (!resume) {
      // levels not yet in use: position is the head sentinel
      for (int8_t lvl = pTbData->sl.level; lvl < pTbData->sl.maxLevel; lvl++) {
        pos[lvl] = pCur;
      }
    }

    if (pTbData->sl.level == 0) {
      return;
    }
    if (resume) {
      pCur = pos[pTbData->sl.level - 1];
    }

    for (int8_t lvl = pTbData->sl.level - 1; lvl >= 0; lvl--) {
      for (;;) {
        SMemSkipListNode *pCand = SL_GET_NODE_FORWARD(pCur, lvl);
        if (pCand == pStop) {
          break;
        }

        tsdbRowGetKey(&pCand->row, &nodeKey);
        if (tsdbRowKeyCmpr(&nodeKey, pKey) >= 0) {
          break;
        }

        pCur = pCand;
      }

      pos[lvl] = pCur;
    }
  }
}
519

520
// Draw a random level for a new skip-list node. Starts at 1 and grows by one each time the
// low two bits of the next random number are zero, up to min(maxLevel, current level + 1).
// The list's seed is advanced by every draw.
static FORCE_INLINE int8_t tsdbMemSkipListRandLevel(SMemSkipList *pSl) {
  int8_t cap = TMIN(pSl->maxLevel, pSl->level + 1);
  int8_t picked = 1;

  for (;;) {
    // draw first, then test the cap - the seed advances even on the final, rejected draw
    if ((taosRandR(&pSl->seed) & 0x3) != 0) {
      break;
    }
    if (picked >= cap) {
      break;
    }
    picked++;
  }

  return picked;
}
530
// Allocate a skip-list node for *pRow and splice it into the list next to the positions in
// `pos[]`.
//
// The node gets a random level. For TSDBROW_ROW_FMT rows the row payload is copied into the
// same allocation right behind the node; for TSDBROW_COL_FMT rows only the TSDBROW struct is
// copied. With `forward` non-zero the node is inserted after pos[i] on each of its levels,
// otherwise before pos[i]. In both cases pos[i] is updated to the new node for those levels.
// The node's own links are written with plain stores first; the neighbours' links are then
// switched with atomic stores, from the highest level down.
//
// Returns 0 on success, or terrno when no node was allocated.
static int32_t tbDataDoPut(SMemTable *pMemTable, STbData *pTbData, SMemSkipListNode **pos, TSDBROW *pRow,
                           int8_t forward) {
  SVBufPool        *pBufPool = pMemTable->pTsdb->pVnode->inUse;
  SMemSkipListNode *pNew = NULL;
  int8_t            nLevel;
  int64_t           hdrSize;

  // allocate the node (plus inline row payload for row format)
  nLevel = tsdbMemSkipListRandLevel(&pTbData->sl);
  hdrSize = SL_NODE_SIZE(nLevel);
  if (pRow->type == TSDBROW_ROW_FMT) {
    pNew = (SMemSkipListNode *)vnodeBufPoolMallocAligned(pBufPool, hdrSize + pRow->pTSRow->len);
  } else if (pRow->type == TSDBROW_COL_FMT) {
    pNew = (SMemSkipListNode *)vnodeBufPoolMallocAligned(pBufPool, hdrSize);
  }
  if (pNew == NULL) {
    return terrno;
  }

  pNew->level = nLevel;
  pNew->row = *pRow;
  if (pRow->type == TSDBROW_ROW_FMT) {
    // re-point the copied row at the payload stored behind the node
    pNew->row.pTSRow = (SRow *)((char *)pNew + hdrSize);
    memcpy(pNew->row.pTSRow, pRow->pTSRow, pRow->pTSRow->len);
  }

  if (forward) {
    // 1) wire the new node between pos[l] and its successor
    for (int8_t lvl = 0; lvl < nLevel; lvl++) {
      SL_NODE_FORWARD(pNew, lvl) = SL_NODE_FORWARD(pos[lvl], lvl);
      SL_NODE_BACKWARD(pNew, lvl) = pos[lvl];
    }

    // 2) publish it, top level first
    for (int8_t lvl = nLevel - 1; lvl >= 0; lvl--) {
      SMemSkipListNode *pSucc = SL_NODE_FORWARD(pos[lvl], lvl);

      SL_SET_NODE_FORWARD(pos[lvl], lvl, pNew);
      SL_SET_NODE_BACKWARD(pSucc, lvl, pNew);

      pos[lvl] = pNew;
    }
  } else {
    // 1) wire the new node between pos[l]'s predecessor and pos[l]
    for (int8_t lvl = 0; lvl < nLevel; lvl++) {
      SL_NODE_FORWARD(pNew, lvl) = pos[lvl];
      SL_NODE_BACKWARD(pNew, lvl) = SL_NODE_BACKWARD(pos[lvl], lvl);
    }

    // 2) publish it, top level first
    for (int8_t lvl = nLevel - 1; lvl >= 0; lvl--) {
      SMemSkipListNode *pPred = SL_NODE_BACKWARD(pos[lvl], lvl);

      SL_SET_NODE_FORWARD(pPred, lvl, pNew);
      SL_SET_NODE_BACKWARD(pos[lvl], lvl, pNew);

      pos[lvl] = pNew;
    }
  }

  pTbData->sl.size++;
  if (pTbData->sl.level < pNew->level) {
    pTbData->sl.level = pNew->level;
  }

  return 0;
}
600

601
static int32_t tsdbInsertColDataToTable(SMemTable *pMemTable, STbData *pTbData, int64_t version,
1,156✔
602
                                        SSubmitTbData *pSubmitTbData, int32_t *affectedRows) {
603
  int32_t code = 0;
1,156✔
604

605
  SVBufPool *pPool = pMemTable->pTsdb->pVnode->inUse;
1,156✔
606
  int32_t    nColData = TARRAY_SIZE(pSubmitTbData->aCol);
1,156✔
607
  SColData  *aColData = (SColData *)TARRAY_DATA(pSubmitTbData->aCol);
1,156✔
608

609
  // copy and construct block data
610
  SBlockData *pBlockData = vnodeBufPoolMalloc(pPool, sizeof(*pBlockData));
1,156✔
611
  if (pBlockData == NULL) {
1,156!
612
    code = terrno;
×
613
    goto _exit;
×
614
  }
615

616
  pBlockData->suid = pTbData->suid;
1,156✔
617
  pBlockData->uid = pTbData->uid;
1,156✔
618
  pBlockData->nRow = aColData[0].nVal;
1,156✔
619
  pBlockData->aUid = NULL;
1,156✔
620
  pBlockData->aVersion = vnodeBufPoolMalloc(pPool, aColData[0].nData);
1,156✔
621
  if (pBlockData->aVersion == NULL) {
1,156!
622
    code = terrno;
×
623
    goto _exit;
×
624
  }
625
  for (int32_t i = 0; i < pBlockData->nRow; i++) {  // todo: here can be optimized
74,523✔
626
    pBlockData->aVersion[i] = version;
73,367✔
627
  }
628

629
  pBlockData->aTSKEY = vnodeBufPoolMalloc(pPool, aColData[0].nData);
1,156✔
630
  if (pBlockData->aTSKEY == NULL) {
1,156!
631
    code = terrno;
×
632
    goto _exit;
×
633
  }
634
  memcpy(pBlockData->aTSKEY, aColData[0].pData, aColData[0].nData);
1,156✔
635

636
  pBlockData->nColData = nColData - 1;
1,156✔
637
  pBlockData->aColData = vnodeBufPoolMalloc(pPool, sizeof(SColData) * pBlockData->nColData);
1,156✔
638
  if (pBlockData->aColData == NULL) {
1,156!
639
    code = terrno;
×
640
    goto _exit;
×
641
  }
642

643
  for (int32_t iColData = 0; iColData < pBlockData->nColData; ++iColData) {
7,291✔
644
    code = tColDataCopy(&aColData[iColData + 1], &pBlockData->aColData[iColData], (xMallocFn)vnodeBufPoolMalloc, pPool);
6,135✔
645
    if (code) goto _exit;
6,135!
646
  }
647

648
  // loop to add each row to the skiplist
649
  SMemSkipListNode *pos[SL_MAX_LEVEL];
650
  TSDBROW           tRow = tsdbRowFromBlockData(pBlockData, 0);
1,156✔
651
  STsdbRowKey       key;
652

653
  // first row
654
  tsdbRowGetKey(&tRow, &key);
1,156✔
655
  tbDataMovePosTo(pTbData, pos, &key, SL_MOVE_BACKWARD);
1,155✔
656
  if ((code = tbDataDoPut(pMemTable, pTbData, pos, &tRow, 0))) goto _exit;
1,156!
657
  pTbData->minKey = TMIN(pTbData->minKey, key.key.ts);
1,156✔
658

659
  // remain row
660
  ++tRow.iRow;
1,156✔
661
  if (tRow.iRow < pBlockData->nRow) {
1,156✔
662
    for (int8_t iLevel = pos[0]->level; iLevel < pTbData->sl.maxLevel; iLevel++) {
4,944✔
663
      pos[iLevel] = SL_NODE_BACKWARD(pos[iLevel], iLevel);
3,944✔
664
    }
665

666
    while (tRow.iRow < pBlockData->nRow) {
73,009✔
667
      tsdbRowGetKey(&tRow, &key);
72,007✔
668

669
      if (SL_NODE_FORWARD(pos[0], 0) != pTbData->sl.pTail) {
71,969✔
670
        tbDataMovePosTo(pTbData, pos, &key, SL_MOVE_FROM_POS);
4,744✔
671
      }
672

673
      if ((code = tbDataDoPut(pMemTable, pTbData, pos, &tRow, 1))) goto _exit;
71,917!
674

675
      ++tRow.iRow;
72,009✔
676
    }
677
  }
678

679
  if (key.key.ts >= pTbData->maxKey) {
1,158✔
680
    pTbData->maxKey = key.key.ts;
1,133✔
681
  }
682

683
  if (!TSDB_CACHE_NO(pMemTable->pTsdb->pVnode->config) && !tsUpdateCacheBatch) {
1,158!
684
    if (tsdbCacheColFormatUpdate(pMemTable->pTsdb, pTbData->suid, pTbData->uid, pBlockData) != 0) {
×
685
      tsdbError("vgId:%d, failed to update cache data from table suid:%" PRId64 " uid:%" PRId64 " at version %" PRId64,
×
686
                TD_VID(pMemTable->pTsdb->pVnode), pTbData->suid, pTbData->uid, version);
687
    }
688
  }
689

690
  // SMemTable
691
  pMemTable->minKey = TMIN(pMemTable->minKey, pTbData->minKey);
1,156✔
692
  pMemTable->maxKey = TMAX(pMemTable->maxKey, pTbData->maxKey);
1,156✔
693
  pMemTable->nRow += pBlockData->nRow;
1,156✔
694

695
  if (affectedRows) *affectedRows = pBlockData->nRow;
1,156!
696

697
_exit:
×
698
  return code;
1,156✔
699
}
700

701
static int32_t tsdbInsertRowDataToTable(SMemTable *pMemTable, STbData *pTbData, int64_t version,
24,222,897✔
702
                                        SSubmitTbData *pSubmitTbData, int32_t *affectedRows) {
703
  int32_t code = 0;
24,222,897✔
704

705
  int32_t           nRow = TARRAY_SIZE(pSubmitTbData->aRowP);
24,222,897✔
706
  SRow            **aRow = (SRow **)TARRAY_DATA(pSubmitTbData->aRowP);
24,222,897✔
707
  STsdbRowKey       key;
708
  SMemSkipListNode *pos[SL_MAX_LEVEL];
709
  TSDBROW           tRow = {.type = TSDBROW_ROW_FMT, .version = version};
24,222,897✔
710
  int32_t           iRow = 0;
24,222,897✔
711

712
  // backward put first data
713
  tRow.pTSRow = aRow[iRow++];
24,222,897✔
714
  tsdbRowGetKey(&tRow, &key);
24,222,897✔
715
  tbDataMovePosTo(pTbData, pos, &key, SL_MOVE_BACKWARD);
24,222,882✔
716
  code = tbDataDoPut(pMemTable, pTbData, pos, &tRow, 0);
24,222,812✔
717
  if (code) goto _exit;
24,223,000!
718

719
  pTbData->minKey = TMIN(pTbData->minKey, key.key.ts);
24,223,000✔
720

721
  // forward put rest data
722
  if (iRow < nRow) {
24,223,000✔
723
    for (int8_t iLevel = pos[0]->level; iLevel < pTbData->sl.maxLevel; iLevel++) {
7,062,201✔
724
      pos[iLevel] = SL_NODE_BACKWARD(pos[iLevel], iLevel);
5,558,986✔
725
    }
726

727
    while (iRow < nRow) {
1,451,680,902✔
728
      tRow.pTSRow = aRow[iRow];
1,450,202,295✔
729
      tsdbRowGetKey(&tRow, &key);
1,450,202,295✔
730

731
      if (SL_NODE_FORWARD(pos[0], 0) != pTbData->sl.pTail) {
1,450,009,764✔
732
        tbDataMovePosTo(pTbData, pos, &key, SL_MOVE_FROM_POS);
43,815,716✔
733
      }
734

735
      code = tbDataDoPut(pMemTable, pTbData, pos, &tRow, 1);
1,450,005,706✔
736
      if (code) goto _exit;
1,450,177,687!
737

738
      iRow++;
1,450,177,687✔
739
    }
740
  }
741

742
  if (key.key.ts >= pTbData->maxKey) {
24,198,392✔
743
    pTbData->maxKey = key.key.ts;
23,984,435✔
744
  }
745
  if (!TSDB_CACHE_NO(pMemTable->pTsdb->pVnode->config) && !tsUpdateCacheBatch) {
24,198,392!
746
    TAOS_UNUSED(tsdbCacheRowFormatUpdate(pMemTable->pTsdb, pTbData->suid, pTbData->uid, version, nRow, aRow));
×
747
  }
748

749
  // SMemTable
750
  pMemTable->minKey = TMIN(pMemTable->minKey, pTbData->minKey);
24,222,961✔
751
  pMemTable->maxKey = TMAX(pMemTable->maxKey, pTbData->maxKey);
24,222,961✔
752
  pMemTable->nRow += nRow;
24,222,961✔
753

754
  if (affectedRows) *affectedRows = nRow;
24,222,961!
755

756
_exit:
×
757
  return code;
24,222,961✔
758
}
759

760
// Number of nodes currently stored in the table's skip list (its `size` counter).
int32_t tsdbGetNRowsInTbData(STbData *pTbData) {
  return pTbData->sl.size;
}
761

762
// Take a reference on the memtable and register `pQNode` with the memtable's buffer pool.
// A previous reference count of zero or less is logged as an error, but the call still
// proceeds. Always returns 0.
int32_t tsdbRefMemTable(SMemTable *pMemTable, SQueryNode *pQNode) {
  int32_t prevRef = atomic_fetch_add_32(&pMemTable->nRef, 1);

  if (prevRef <= 0) {
    tsdbError("vgId:%d, memtable ref count is invalid, ref:%d", TD_VID(pMemTable->pTsdb->pVnode), prevRef);
  }

  vnodeBufPoolRegisterQuery(pMemTable->pPool, pQNode);

  return 0;
}
775

776
// Drop one reference on the memtable. When `pNode` is non-NULL it is first deregistered from
// the memtable's buffer pool. The memtable is destroyed when the count reaches zero.
void tsdbUnrefMemTable(SMemTable *pMemTable, SQueryNode *pNode, bool proactive) {
  if (pNode != NULL) {
    vnodeBufPoolDeregisterQuery(pMemTable->pPool, pNode, proactive);
  }

  int32_t remaining = atomic_sub_fetch_32(&pMemTable->nRef, 1);
  if (remaining == 0) {
    tsdbMemTableDestroy(pMemTable, proactive);
  }
}
785

786
// Comparator over elements that are `STbData *` (p1/p2 point at the pointers): orders by suid
// first, then by uid. Returns -1, 0 or 1.
static FORCE_INLINE int32_t tbDataPCmprFn(const void *p1, const void *p2) {
  STbData *lhs = *(STbData **)p1;
  STbData *rhs = *(STbData **)p2;

  if (lhs->suid != rhs->suid) {
    return (lhs->suid < rhs->suid) ? -1 : 1;
  }
  if (lhs->uid != rhs->uid) {
    return (lhs->uid < rhs->uid) ? -1 : 1;
  }
  return 0;
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc