• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #4986

15 Mar 2026 08:32AM UTC coverage: 37.305% (-31.3%) from 68.601%
#4986

push

travis-ci

tomchon
test: keep docs and unit test

125478 of 336361 relevant lines covered (37.3%)

1134847.06 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

4.86
/source/dnode/vnode/src/tsdb/tsdbCache.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15
#include "functionMgt.h"
16
#include "tsdb.h"
17
#include "tsdbDataFileRW.h"
18
#include "tsdbIter.h"
19
#include "tsdbReadUtil.h"
20
#include "tss.h"
21
#include "vnd.h"
22

23
#define ROCKS_BATCH_SIZE (4096)
24

25
/*
 * Release one reference on an LRU cache handle.
 *
 * Forwards to taosLRUCacheRelease() and emits a trace line when that call
 * reports a falsy result.
 */
void tsdbLRUCacheRelease(SLRUCache *cache, LRUHandle *handle, bool eraseIfLastRef) {
  bool released = taosLRUCacheRelease(cache, handle, eraseIfLastRef);
  if (released) {
    return;
  }

  tsdbTrace(" release lru cache failed");
}
×
30

31
#ifdef USE_SHARED_STORAGE
32

33
/*
 * Create the block LRU cache of a tsdb instance together with its mutex.
 *
 * Capacity is tsSsBlockCacheSize * max(tsSsBlockSize, 1024) * tsdbPageSize.
 * On success the cache is stored in pTsdb->bCache; on allocation failure
 * TSDB_CODE_OUT_OF_MEMORY is returned and logged.
 */
static int32_t tsdbOpenBCache(STsdb *pTsdb) {
  int32_t code = 0;
  int32_t lino = 0;

  int32_t pageSize = pTsdb->pVnode->config.tsdbPageSize;

  // block size is clamped to at least 1024
  int64_t blockSize = 1024;
  if (tsSsBlockSize > 1024) {
    blockSize = tsSsBlockSize;
  }

  int64_t    capacity = (int64_t)tsSsBlockCacheSize * blockSize * pageSize;
  SLRUCache *pBlockCache = taosLRUCacheInit(capacity, 0, .5);
  if (pBlockCache == NULL) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  taosLRUCacheSetStrictCapacity(pBlockCache, false);
  (void)taosThreadMutexInit(&pTsdb->bMutex, NULL);
  pTsdb->bCache = pBlockCache;

_err:
  if (code) {
    tsdbError("tsdb/bcache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
57

58
/*
 * Tear down the block LRU cache: trace the element count before and after
 * erasing unreferenced entries, clean the cache up, then destroy bMutex.
 * Does nothing when no block cache is attached.
 */
static void tsdbCloseBCache(STsdb *pTsdb) {
  SLRUCache *pBlockCache = pTsdb->bCache;
  if (pBlockCache == NULL) {
    return;
  }

  int32_t nBefore = taosLRUCacheGetElems(pBlockCache);
  tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), nBefore);

  taosLRUCacheEraseUnrefEntries(pBlockCache);

  int32_t nAfter = taosLRUCacheGetElems(pBlockCache);
  tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), nAfter);

  taosLRUCacheCleanup(pBlockCache);
  (void)taosThreadMutexDestroy(&pTsdb->bMutex);
}
×
72

73
/*
 * Create the page LRU cache of a tsdb instance together with its mutex.
 *
 * Capacity is tsSsPageCacheSize * tsdbPageSize. On success the cache is
 * stored in pTsdb->pgCache; on allocation failure TSDB_CODE_OUT_OF_MEMORY is
 * returned and logged.
 */
static int32_t tsdbOpenPgCache(STsdb *pTsdb) {
  int32_t code = 0;
  int32_t lino = 0;

  int32_t    pageSize = pTsdb->pVnode->config.tsdbPageSize;
  int64_t    capacity = (int64_t)tsSsPageCacheSize * pageSize;
  SLRUCache *pPageCache = taosLRUCacheInit(capacity, 0, .5);
  if (pPageCache == NULL) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  taosLRUCacheSetStrictCapacity(pPageCache, false);
  (void)taosThreadMutexInit(&pTsdb->pgMutex, NULL);
  pTsdb->pgCache = pPageCache;

_err:
  if (code) {
    tsdbError("tsdb/pgcache: vgId:%d, open failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));
  }

  TAOS_RETURN(code);
}
95

96
/*
 * Tear down the page LRU cache created by tsdbOpenPgCache().
 *
 * Traces the element count before and after erasing unreferenced entries,
 * cleans the cache up and destroys the page-cache mutex. Does nothing when
 * no page cache is attached.
 */
static void tsdbClosePgCache(STsdb *pTsdb) {
  SLRUCache *pCache = pTsdb->pgCache;
  if (pCache) {
    int32_t elems = taosLRUCacheGetElems(pCache);
    tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), elems);
    taosLRUCacheEraseUnrefEntries(pCache);
    elems = taosLRUCacheGetElems(pCache);
    tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), elems);

    taosLRUCacheCleanup(pCache);

    // tsdbOpenPgCache() initialises pgMutex, so that is the mutex to destroy
    // here; bMutex belongs to the block cache and is destroyed by
    // tsdbCloseBCache().
    (void)taosThreadMutexDestroy(&pTsdb->pgMutex);
  }
}
×
110

111
#endif  // USE_SHARED_STORAGE
112

113
#define ROCKS_KEY_LEN (sizeof(tb_uid_t) + sizeof(int16_t) + sizeof(int8_t))
114

115
enum {
116
  LFLAG_LAST_ROW = 0,
117
  LFLAG_LAST = 1,
118
};
119

120
/*
 * Key of one cached last/last_row column entry.
 * myCmp() orders keys by uid, then cid, then (lflag & LFLAG_LAST);
 * ROCKS_KEY_LEN is the sum of the three field sizes (no padding).
 */
typedef struct {
121
  tb_uid_t uid;  // table uid
122
  int16_t  cid;  // column id
123
  int8_t   lflag;  // LFLAG_LAST_ROW or LFLAG_LAST, see IS_LAST_ROW_KEY / IS_LAST_KEY
124
} SLastKey;
125

126
#define IS_LAST_ROW_KEY(k) (((k).lflag & LFLAG_LAST) == LFLAG_LAST_ROW)
127
#define IS_LAST_KEY(k)     (((k).lflag & LFLAG_LAST) == LFLAG_LAST)
128

129
/*
 * Build the path of the rocksdb cache directory for this tsdb:
 * <primary vnode path><sep><tsdb name><sep>cache.rdb
 *
 * `path` must be able to hold TSDB_FILENAME_LEN bytes.
 */
static void tsdbGetRocksPath(STsdb *pTsdb, char *path) {
  vnodeGetPrimaryPath(pTsdb->pVnode, false, path, TSDB_FILENAME_LEN);

  // append the cache sub-path right after what vnodeGetPrimaryPath() wrote
  int32_t used = strlen(path);
  char   *tail = path + used;
  snprintf(tail, TSDB_FILENAME_LEN - used - 1, "%s%s%scache.rdb", TD_DIRSEP, pTsdb->name, TD_DIRSEP);
}
40✔
136

137
/* Comparator name callback handed to rocksdb_comparator_create(). */
static const char *myCmpName(void *state) {
  (void)state;  // no comparator state is used

  return "myCmp";
}
141

142
/* Comparator destructor callback; there is no state to release. */
static void myCmpDestroy(void *state) {
  (void)state;
}
40✔
143

144
static int myCmp(void *state, const char *a, size_t alen, const char *b, size_t blen) {
×
145
  (void)state;
146
  (void)alen;
147
  (void)blen;
148
  SLastKey *lhs = (SLastKey *)a;
×
149
  SLastKey *rhs = (SLastKey *)b;
×
150

151
  if (lhs->uid < rhs->uid) {
×
152
    return -1;
×
153
  } else if (lhs->uid > rhs->uid) {
×
154
    return 1;
×
155
  }
156

157
  if (lhs->cid < rhs->cid) {
×
158
    return -1;
×
159
  } else if (lhs->cid > rhs->cid) {
×
160
    return 1;
×
161
  }
162

163
  if ((lhs->lflag & LFLAG_LAST) < (rhs->lflag & LFLAG_LAST)) {
×
164
    return -1;
×
165
  } else if ((lhs->lflag & LFLAG_LAST) > (rhs->lflag & LFLAG_LAST)) {
×
166
    return 1;
×
167
  }
168

169
  return 0;
×
170
}
171

172
/*
 * Open the rocksdb instance backing the last/last_row cache and fill in
 * pTsdb->rCache.
 *
 * Every rocksdb object is created into a local first and only published to
 * pTsdb->rCache once the whole sequence has succeeded, so a failed open
 * leaves no dangling pointers in rCache. On failure everything created so
 * far is released through the single cleanup path below.
 *
 * Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY when a rocksdb object cannot
 * be created or the database cannot be opened, or the code reported by the
 * failing helper. Without USE_ROCKSDB this is a no-op returning 0.
 */
static int32_t tsdbOpenRocksCache(STsdb *pTsdb) {
  int32_t code = 0, lino = 0;
#ifdef USE_ROCKSDB
  rocksdb_block_based_table_options_t *tableoptions = NULL;
  rocksdb_options_t                   *options = NULL;
  rocksdb_writeoptions_t              *writeoptions = NULL;
  rocksdb_readoptions_t               *readoptions = NULL;
  rocksdb_flushoptions_t              *flushoptions = NULL;
  rocksdb_writebatch_t                *writebatch = NULL;
  rocksdb_t                           *db = NULL;
  SArray                              *ctxArray = NULL;
  bool                                 mutexReady = false;
  char                                *err = NULL;
  char                                 cachePath[TSDB_FILENAME_LEN] = {0};

  rocksdb_comparator_t *cmp = rocksdb_comparator_create(NULL, myCmpDestroy, myCmp, myCmpName);
  if (NULL == cmp) {
    TAOS_RETURN(TSDB_CODE_OUT_OF_MEMORY);
  }

  tableoptions = rocksdb_block_based_options_create();
  if (NULL == tableoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  options = rocksdb_options_create();
  if (NULL == options) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  rocksdb_options_set_create_if_missing(options, 1);
  rocksdb_options_set_comparator(options, cmp);
  rocksdb_options_set_block_based_table_factory(options, tableoptions);
  rocksdb_options_set_info_log_level(options, 2);  // WARN_LEVEL

  writeoptions = rocksdb_writeoptions_create();
  if (NULL == writeoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }
  rocksdb_writeoptions_disable_WAL(writeoptions, 1);

  readoptions = rocksdb_readoptions_create();
  if (NULL == readoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  tsdbGetRocksPath(pTsdb, cachePath);

  db = rocksdb_open(options, cachePath, &err);
  if (NULL == db) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, err);
    rocksdb_free(err);

    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  flushoptions = rocksdb_flushoptions_create();
  if (NULL == flushoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  writebatch = rocksdb_writebatch_create();
  if (NULL == writebatch) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  TAOS_CHECK_GOTO(taosThreadMutexInit(&pTsdb->rCache.writeBatchMutex, NULL), &lino, _err);
  mutexReady = true;

  ctxArray = taosArrayInit(16, sizeof(SLastUpdateCtx));
  if (!ctxArray) {
    TAOS_CHECK_GOTO(terrno, &lino, _err);
  }

  // everything succeeded: publish the objects
  pTsdb->rCache.tableoptions = tableoptions;
  pTsdb->rCache.writebatch = writebatch;
  pTsdb->rCache.my_comparator = cmp;
  pTsdb->rCache.options = options;
  pTsdb->rCache.writeoptions = writeoptions;
  pTsdb->rCache.readoptions = readoptions;
  pTsdb->rCache.flushoptions = flushoptions;
  pTsdb->rCache.db = db;
  pTsdb->rCache.sver = -1;
  pTsdb->rCache.suid = -1;
  pTsdb->rCache.uid = -1;
  pTsdb->rCache.pTSchema = NULL;
  pTsdb->rCache.ctxArray = ctxArray;

  TAOS_RETURN(code);

_err:
  // release in reverse order of creation; only what was actually created
  if (mutexReady) {
    (void)taosThreadMutexDestroy(&pTsdb->rCache.writeBatchMutex);
  }
  if (writebatch) {
    rocksdb_writebatch_destroy(writebatch);
  }
  if (flushoptions) {
    rocksdb_flushoptions_destroy(flushoptions);
  }
  if (db) {
    // close the local handle: rCache.db has not been assigned on this path
    rocksdb_close(db);
  }
  if (readoptions) {
    rocksdb_readoptions_destroy(readoptions);
  }
  if (writeoptions) {
    rocksdb_writeoptions_destroy(writeoptions);
  }
  if (options) {
    rocksdb_options_destroy(options);
  }
  if (tableoptions) {
    rocksdb_block_based_options_destroy(tableoptions);
  }
  rocksdb_comparator_destroy(cmp);
#endif
  TAOS_RETURN(code);
}
263

264
/*
 * Close the rocksdb cache and release everything tsdbOpenRocksCache()
 * stored in pTsdb->rCache, plus the cached schema and the update-context
 * array. No-op without USE_ROCKSDB.
 */
static void tsdbCloseRocksCache(STsdb *pTsdb) {
#ifdef USE_ROCKSDB
  SRocksCache *pRCache = &pTsdb->rCache;

  // database first, then its write-batch mutex
  rocksdb_close(pRCache->db);
  (void)taosThreadMutexDestroy(&pRCache->writeBatchMutex);

  // rocksdb helper objects
  rocksdb_flushoptions_destroy(pRCache->flushoptions);
  rocksdb_writebatch_destroy(pRCache->writebatch);
  rocksdb_readoptions_destroy(pRCache->readoptions);
  rocksdb_writeoptions_destroy(pRCache->writeoptions);
  rocksdb_options_destroy(pRCache->options);
  rocksdb_block_based_options_destroy(pRCache->tableoptions);
  rocksdb_comparator_destroy(pRCache->my_comparator);

  // tsdb-side bookkeeping
  taosMemoryFree(pRCache->pTSchema);
  taosArrayDestroy(pRCache->ctxArray);
#endif
}
40✔
279

280
/*
 * Write the pending rocksdb write batch when it is due.
 *
 * The batch is written (and then cleared) when it holds at least
 * ROCKS_BATCH_SIZE entries, or when `force` is set and it is not empty.
 * A write error is logged; the batch is cleared either way.
 */
static void rocksMayWrite(STsdb *pTsdb, bool force) {
#ifdef USE_ROCKSDB
  rocksdb_writebatch_t *pBatch = pTsdb->rCache.writebatch;

  int  count = rocksdb_writebatch_count(pBatch);
  bool due = (count >= ROCKS_BATCH_SIZE) || (force && count > 0);
  if (!due) {
    return;
  }

  char *err = NULL;
  rocksdb_write(pTsdb->rCache.db, pTsdb->rCache.writeoptions, pBatch, &err);
  if (NULL != err) {
    tsdbError("vgId:%d, %s failed at line %d, count: %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, count,
              err);
    rocksdb_free(err);
  }

  rocksdb_writebatch_clear(pBatch);
#endif
}
16✔
299

300
/*
 * Fixed-size header found at the start of every serialized cache value
 * (read by tsdbCacheDeserializeV0(), written by tsdbCacheSerializeV0()).
 * For variable-length and DECIMAL values the payload bytes follow directly
 * after this struct; newer fields (version, pks, cacheStatus) come after that.
 */
typedef struct {
301
  TSKEY  ts;  // row timestamp
302
  int8_t dirty;
303
  struct {
304
    int16_t cid;
305
    int8_t  type;
306
    int8_t  flag;
307
    union {
308
      int64_t val;  // used for types that are neither variable-length nor DECIMAL
309
      struct {
310
        uint32_t nData;  // payload length in bytes
311
        uint8_t *pData;  // not written or read by the (de)serializers; payload trails the struct
312
      };
313
    } value;
314
  } colVal;
315
} SLastColV0;
316

317
/*
 * Decode the SLastColV0 header at `value` into `pLastCol`.
 *
 * For variable-length and DECIMAL values pData is pointed at the payload
 * bytes that trail the header inside `value` (no copy is made). The row key
 * gets no primary keys and cacheStatus is set to TSDB_LAST_CACHE_VALID.
 *
 * Returns the number of bytes consumed (header plus payload). No bounds
 * checking is done here; the caller compares the result with the buffer size.
 */
static int32_t tsdbCacheDeserializeV0(char const *value, SLastCol *pLastCol) {
  SLastColV0 *pHdr = (SLastColV0 *)value;
  uint8_t    *pPayload = (uint8_t *)(&pHdr[1]);

  pLastCol->rowKey.ts = pHdr->ts;
  pLastCol->rowKey.numOfPKs = 0;
  pLastCol->dirty = pHdr->dirty;
  pLastCol->colVal.cid = pHdr->colVal.cid;
  pLastCol->colVal.flag = pHdr->colVal.flag;
  pLastCol->colVal.value.type = pHdr->colVal.type;

  pLastCol->cacheStatus = TSDB_LAST_CACHE_VALID;

  if (IS_VAR_DATA_TYPE(pLastCol->colVal.value.type)) {
    // variable-length: empty payload maps to a NULL data pointer
    pLastCol->colVal.value.nData = pHdr->colVal.value.nData;
    pLastCol->colVal.value.pData = NULL;
    if (pLastCol->colVal.value.nData > 0) {
      pLastCol->colVal.value.pData = pPayload;
    }
    return sizeof(SLastColV0) + pHdr->colVal.value.nData;
  }

  if (pLastCol->colVal.value.type == TSDB_DATA_TYPE_DECIMAL) {
    // decimal: data pointer always refers to the trailing bytes
    pLastCol->colVal.value.nData = pHdr->colVal.value.nData;
    pLastCol->colVal.value.pData = pPayload;
    return sizeof(SLastColV0) + pHdr->colVal.value.nData;
  }

  // everything else is stored inline in the header
  pLastCol->colVal.value.val = pHdr->colVal.value.val;
  return sizeof(SLastColV0);
}
345

346
/*
 * Decode a serialized cache value into a freshly allocated SLastCol.
 *
 * Layout: SLastColV0 header [+ payload], optionally followed by
 * version(1) numOfPKs(1) { SValue [+ var data] }* cacheStatus(1).
 * A buffer that ends right after the V0 part is accepted as version 0.
 *
 * Pointers stored in the result (column payload, var-length pk data) refer
 * into `value`; nothing is copied, so `value` must outlive their use.
 *
 * Every read is bounds-checked against `size` before it happens; truncated
 * or inconsistent input yields TSDB_CODE_INVALID_DATA_FMT.
 *
 * @param value      serialized bytes, may be NULL
 * @param size       number of bytes available at `value`
 * @param ppLastCol  receives the result on success; untouched on failure.
 *                   The caller owns the returned object.
 * @return TSDB_CODE_SUCCESS, TSDB_CODE_INVALID_PARA when value is NULL,
 *         TSDB_CODE_INVALID_DATA_FMT on malformed input, or terrno when the
 *         allocation fails.
 */
static int32_t tsdbCacheDeserialize(char const *value, size_t size, SLastCol **ppLastCol) {
  if (!value) {
    return TSDB_CODE_INVALID_PARA;
  }

  // the V0 decoder reads the whole fixed header unconditionally
  if (size < sizeof(SLastColV0)) {
    TAOS_RETURN(TSDB_CODE_INVALID_DATA_FMT);
  }

  SLastCol *pLastCol = taosMemoryCalloc(1, sizeof(SLastCol));
  if (NULL == pLastCol) {
    return terrno;
  }

  // a negative (overflowed) result becomes a huge size_t and is rejected below
  size_t offset = (size_t)tsdbCacheDeserializeV0(value, pLastCol);
  if (offset == size) {
    // version 0
    *ppLastCol = pLastCol;

    TAOS_RETURN(TSDB_CODE_SUCCESS);
  } else if (offset > size) {
    goto _invalid;
  }

  // version + numOfPKs
  if (size - offset < sizeof(int8_t) + sizeof(uint8_t)) {
    goto _invalid;
  }
  int8_t version = *(int8_t *)(value + offset);
  offset += sizeof(int8_t);

  uint8_t numOfPKs = *(uint8_t *)(value + offset);
  offset += sizeof(uint8_t);

  // NOTE(review): assumes rowKey.pks is a fixed-size array member - confirm
  if (numOfPKs > sizeof(pLastCol->rowKey.pks) / sizeof(pLastCol->rowKey.pks[0])) {
    goto _invalid;
  }
  pLastCol->rowKey.numOfPKs = numOfPKs;

  // pks
  for (int32_t i = 0; i < numOfPKs; i++) {
    SValue *pPk = &pLastCol->rowKey.pks[i];

    if (size - offset < sizeof(SValue)) {
      goto _invalid;
    }
    // memcpy: the record is byte-packed, so the source may be misaligned
    (void)memcpy(pPk, value + offset, sizeof(SValue));
    offset += sizeof(SValue);

    if (IS_VAR_DATA_TYPE(pPk->type)) {
      uint32_t nData = pPk->nData;

      pPk->pData = NULL;
      if (nData > 0) {
        if (size - offset < nData) {
          goto _invalid;
        }
        pPk->pData = (uint8_t *)value + offset;
        offset += nData;
      }
    }
  }

  if (version >= LAST_COL_VERSION_2) {
    if (offset >= size) {
      goto _invalid;
    }
    pLastCol->cacheStatus = *(uint8_t *)(value + offset);
  }

  *ppLastCol = pLastCol;

  TAOS_RETURN(TSDB_CODE_SUCCESS);

_invalid:
  taosMemoryFreeClear(pLastCol);

  TAOS_RETURN(TSDB_CODE_INVALID_DATA_FMT);
}
404

405
/*
406
typedef struct {
407
  SLastColV0 lastColV0;
408
  char       colData[];
409
  int8_t     version;
410
  uint8_t    numOfPKs;
411
  SValue     pks[0];
412
  char       pk0Data[];
413
  SValue     pks[1];
414
  char       pk1Data[];
415
  ...
416
} SLastColDisk;
417
*/
418
/*
 * Write the SLastColV0 header for `pLastCol` at `value`.
 *
 * Variable-length and DECIMAL values store their length in the header and
 * copy their payload right behind it; all other types store the value
 * inline. The buffer must be large enough; no size is checked here.
 *
 * Returns the number of bytes written (header plus payload).
 */
static int32_t tsdbCacheSerializeV0(char const *value, SLastCol *pLastCol) {
  SLastColV0 *pHdr = (SLastColV0 *)value;

  pHdr->ts = pLastCol->rowKey.ts;
  pHdr->dirty = pLastCol->dirty;
  pHdr->colVal.cid = pLastCol->colVal.cid;
  pHdr->colVal.flag = pLastCol->colVal.flag;
  pHdr->colVal.type = pLastCol->colVal.value.type;

  bool hasPayload =
      IS_VAR_DATA_TYPE(pLastCol->colVal.value.type) || pLastCol->colVal.value.type == TSDB_DATA_TYPE_DECIMAL;
  if (!hasPayload) {
    pHdr->colVal.value.val = pLastCol->colVal.value.val;
    return sizeof(SLastColV0);
  }

  pHdr->colVal.value.nData = pLastCol->colVal.value.nData;
  if (pLastCol->colVal.value.nData > 0) {
    memcpy(&pHdr[1], pLastCol->colVal.value.pData, pLastCol->colVal.value.nData);
  }
  return sizeof(SLastColV0) + pLastCol->colVal.value.nData;
}
445

446
/*
 * Serialize `pLastCol` into a newly allocated buffer.
 *
 * Layout: SLastColV0 header [+ payload] version(1) numOfPKs(1)
 *         { SValue [+ var data] }* cacheStatus(1)
 *
 * The buffer is sized from the same lengths the writers use: for both
 * variable-length and DECIMAL values tsdbCacheSerializeV0() copies exactly
 * nData payload bytes, so nData (not a fixed decimal width) is what gets
 * reserved. This keeps the write inside the allocation and leaves no
 * uninitialised bytes in the stored value.
 *
 * @param pLastCol  entry to serialize
 * @param value     receives the buffer; the caller frees it. NULL on failure.
 * @param size      receives the buffer size in bytes
 * @return TSDB_CODE_SUCCESS, or terrno when the allocation fails.
 */
static int32_t tsdbCacheSerialize(SLastCol *pLastCol, char **value, size_t *size) {
  *size = sizeof(SLastColV0);
  if (IS_VAR_DATA_TYPE(pLastCol->colVal.value.type) || pLastCol->colVal.value.type == TSDB_DATA_TYPE_DECIMAL) {
    *size += pLastCol->colVal.value.nData;
  }
  *size += sizeof(uint8_t) + sizeof(uint8_t) + sizeof(uint8_t);  // version + numOfPKs + cacheStatus

  for (uint8_t i = 0; i < pLastCol->rowKey.numOfPKs; i++) {
    *size += sizeof(SValue);
    if (IS_VAR_DATA_TYPE(pLastCol->rowKey.pks[i].type)) {
      *size += pLastCol->rowKey.pks[i].nData;
    }
  }

  *value = taosMemoryMalloc(*size);
  if (NULL == *value) {
    TAOS_RETURN(terrno);
  }

  int32_t offset = tsdbCacheSerializeV0(*value, pLastCol);

  // version
  ((uint8_t *)(*value + offset))[0] = LAST_COL_VERSION;
  offset++;

  // numOfPKs
  ((uint8_t *)(*value + offset))[0] = pLastCol->rowKey.numOfPKs;
  offset++;

  // pks
  for (uint8_t i = 0; i < pLastCol->rowKey.numOfPKs; i++) {
    // memcpy: the destination is byte-packed and may be misaligned for SValue
    (void)memcpy(*value + offset, &pLastCol->rowKey.pks[i], sizeof(SValue));
    offset += sizeof(SValue);
    if (IS_VAR_DATA_TYPE(pLastCol->rowKey.pks[i].type)) {
      if (pLastCol->rowKey.pks[i].nData > 0) {
        memcpy(*value + offset, pLastCol->rowKey.pks[i].pData, pLastCol->rowKey.pks[i].nData);
      }
      offset += pLastCol->rowKey.pks[i].nData;
    }
  }

  ((uint8_t *)(*value + offset))[0] = pLastCol->cacheStatus;

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
494

495
static int32_t tsdbCachePutToRocksdb(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol);
496

497
int tsdbCacheFlushDirty(const void *key, size_t klen, void *value, void *ud) {
×
498
  SLastCol *pLastCol = (SLastCol *)value;
×
499

500
  if (pLastCol->dirty) {
×
501
    STsdb *pTsdb = (STsdb *)ud;
×
502

503
    int32_t code = tsdbCachePutToRocksdb(pTsdb, (SLastKey *)key, pLastCol);
×
504
    if (code) {
×
505
      tsdbError("tsdb/cache: vgId:%d, flush dirty lru failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
×
506
      return code;
×
507
    }
508

509
    pLastCol->dirty = 0;
×
510

511
    rocksMayWrite(pTsdb, false);
×
512
  }
513

514
  return 0;
×
515
}
516

517
/*
 * Tell whether `key` is covered by the delete skyline.
 *
 * *iSkyline is the index of the upper end of the skyline segment currently
 * examined; it is moved towards 0 while segments are ruled out and keeps its
 * position for the next call. Nothing is examined when *iSkyline is not
 * positive.
 *
 * Returns true when the key lies inside a segment and its version is not
 * newer than the covering delete version.
 */
static bool tsdbKeyDeleted(TSDBKEY *key, SArray *pSkyline, int64_t *iSkyline) {
  while (*iSkyline > 0) {
    TSDBKEY *pUpper = (TSDBKEY *)taosArrayGet(pSkyline, *iSkyline);
    TSDBKEY *pLower = (TSDBKEY *)taosArrayGet(pSkyline, *iSkyline - 1);

    // key is beyond the current segment: not deleted
    if (key->ts > pUpper->ts) {
      return false;
    }

    bool inSegment = (key->ts >= pLower->ts) && (key->ts <= pUpper->ts);
    if (inSegment) {
      bool coveredByLower = key->version <= pLower->version;
      bool coveredByUpper = (key->ts == pUpper->ts) && (key->version <= pUpper->version);
      if (coveredByLower || coveredByUpper) {
        return true;
      }
    }

    // not decided by this segment: step to the previous one, if there is one
    if (*iSkyline <= 1) {
      return false;
    }
    --*iSkyline;
  }

  return false;
}
547

548
// Get next non-deleted row from imem
549
/*
 * Advance the imem iterator to the next row that is not covered by the
 * delete skyline and return it.
 *
 * Deleted rows are skipped: the iterator keeps advancing until a live row is
 * found or it is exhausted. (Stopping at the first deleted row would hide
 * every live row behind it from the caller.)
 *
 * @param pTbIter    iterator to advance
 * @param pSkyline   delete skyline, consulted through tsdbKeyDeleted()
 * @param piSkyline  skyline cursor shared across calls
 * @return the next non-deleted row, or NULL when the iterator is exhausted.
 */
static TSDBROW *tsdbImemGetNextRow(STbDataIter *pTbIter, SArray *pSkyline, int64_t *piSkyline) {
  while (tsdbTbDataIterNext(pTbIter)) {
    TSDBROW *pMemRow = tsdbTbDataIterGet(pTbIter);
    if (pMemRow == NULL) {
      break;
    }

    TSDBKEY rowKey = TSDBROW_KEY(pMemRow);
    if (!tsdbKeyDeleted(&rowKey, pSkyline, piSkyline)) {
      return pMemRow;
    }
  }

  return NULL;
}
563

564
// Get first non-deleted row from imem
565
/*
 * Open `pTbIter` on `pIMem` and return the first row that is not covered by
 * the delete skyline.
 *
 * Returns NULL when the table data holds no row at the iterator's start
 * position. When that row is deleted, the search is handed over to
 * tsdbImemGetNextRow(). `imem` itself is not used.
 */
static TSDBROW *tsdbImemGetFirstRow(SMemTable *imem, STbData *pIMem, STbDataIter *pTbIter, SArray *pSkyline,
                                    int64_t *piSkyline) {
  tsdbTbDataIterOpen(pIMem, NULL, 1, pTbIter);

  TSDBROW *pFirst = tsdbTbDataIterGet(pTbIter);
  if (pFirst == NULL) {
    return NULL;
  }

  TSDBKEY firstKey = TSDBROW_KEY(pFirst);
  if (!tsdbKeyDeleted(&firstKey, pSkyline, piSkyline)) {
    return pFirst;
  }

  // first row is deleted: keep looking through the following rows
  return tsdbImemGetNextRow(pTbIter, pSkyline, piSkyline);
}
585

586
/*
 * Invalidate the schema cached in pTsdb->rCache when it belongs to the given
 * table and `sver` is newer than the cached version.
 *
 * With suid > 0 the cached suid is matched, with suid == 0 the cached uid.
 * On a match the cached version and the matched id are reset to -1; the
 * schema object itself is left in place.
 */
void tsdbCacheInvalidateSchema(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, int32_t sver) {
  SRocksCache *pRCache = &pTsdb->rCache;

  if (pRCache->pTSchema == NULL) return;
  if (sver <= pRCache->sver) return;

  if (suid > 0) {
    if (suid == pRCache->suid) {
      pRCache->sver = -1;
      pRCache->suid = -1;
    }
  } else if (suid == 0) {
    if (uid == pRCache->uid) {
      pRCache->sver = -1;
      pRCache->uid = -1;
    }
  }
}
599

600
/*
 * Make pTsdb->rCache.pTSchema hold the schema of (suid, uid) at version
 * `sver`, reloading it from meta unless it is already cached.
 *
 * The cached schema is reused when the version matches and either suid > 0
 * equals the cached suid, or suid == 0 and uid equals the cached uid.
 *
 * When a reload is needed the old schema is destroyed and its pointer
 * cleared before the new one is fetched. The identity fields are only set to
 * the new values after a successful fetch and are reset to -1 otherwise, so
 * a failed reload can neither leave a dangling pTSchema behind nor make a
 * later call believe the schema is cached.
 *
 * @return 0 on success, otherwise the code from metaGetTbTSchemaEx().
 */
static int32_t tsdbUpdateSkm(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, int32_t sver) {
  SRocksCache *pRCache = &pTsdb->rCache;
  if (pRCache->pTSchema && sver == pRCache->sver) {
    if (suid > 0 && suid == pRCache->suid) {
      return 0;
    }
    if (suid == 0 && uid == pRCache->uid) {
      return 0;
    }
  }

  tDestroyTSchema(pRCache->pTSchema);
  pRCache->pTSchema = NULL;

  int32_t code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, sver, &pRCache->pTSchema);
  if (code != 0) {
    pRCache->suid = -1;
    pRCache->uid = -1;
    pRCache->sver = -1;
    return code;
  }

  pRCache->suid = suid;
  pRCache->uid = uid;
  pRCache->sver = sver;
  return code;
}
617

618
static int32_t tsdbCacheUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, SArray *updCtxArray);
619

620
/*
 * Feed the last/last_row cache of one table from the rows held in `imem`.
 *
 * Steps:
 *  1. load the table's tomb data and, if there is any, build the delete
 *     skyline;
 *  2. take the first non-deleted row: every column yields a LFLAG_LAST_ROW
 *     update, columns carrying a value also yield a LFLAG_LAST update, and
 *     the ids of the remaining columns are remembered as pending;
 *  3. walk the following rows until no column is pending, emitting a
 *     LFLAG_LAST update for each pending column that has a value;
 *  4. apply the collected updates with tsdbCacheUpdate().
 *
 * The shared pTsdb->rCache.ctxArray is used as scratch space and is cleared
 * before returning.
 *
 * Returns 0 on success (including "no live row"), otherwise the first error.
 */
int32_t tsdbLoadFromImem(SMemTable *imem, int64_t suid, int64_t uid) {
  int32_t code = 0;
  int32_t lino = 0;

  STsdb       *pTsdb = imem->pTsdb;
  SArray      *ctxArray = pTsdb->rCache.ctxArray;
  SArray      *pMemDelData = NULL;
  SArray      *pSkyline = NULL;
  int64_t      iSkyline = 0;
  SSHashObj   *pendingCols = NULL;  // column ids still lacking a "last" value
  STSchema    *pTSchema = NULL;
  TSDBROW     *pMemRow = NULL;
  int32_t      nCol;
  STbDataIter  tbIter = {0};
  STsdbRowKey  firstRowKey = {0};
  STSDBRowIter iter = {0};

  STbData *pIMem = tsdbGetTbDataFromMemTable(imem, suid, uid);

  // load imem tomb data and build skyline
  TAOS_CHECK_GOTO(loadMemTombData(&pMemDelData, NULL, pIMem, INT64_MAX), &lino, _exit);

  size_t nTomb = TARRAY_SIZE(pMemDelData);
  if (nTomb > 0) {
    pSkyline = taosArrayInit(32, sizeof(TSDBKEY));
    if (!pSkyline) {
      TAOS_CHECK_EXIT(terrno);
    }

    TAOS_CHECK_EXIT(tsdbBuildDeleteSkyline(pMemDelData, 0, (int32_t)(nTomb - 1), pSkyline));
    iSkyline = taosArrayGetSize(pSkyline) - 1;
  }

  pMemRow = tsdbImemGetFirstRow(imem, pIMem, &tbIter, pSkyline, &iSkyline);
  if (!pMemRow) {
    goto _exit;
  }

  // first row: last_row values for every column, last values where present
  TAOS_CHECK_GOTO(tsdbUpdateSkm(pTsdb, suid, uid, TSDBROW_SVERSION(pMemRow)), &lino, _exit);
  pTSchema = pTsdb->rCache.pTSchema;
  nCol = pTSchema->numOfCols;

  tsdbRowGetKey(pMemRow, &firstRowKey);

  TAOS_CHECK_EXIT(tsdbRowIterOpen(&iter, pMemRow, pTSchema));

  int32_t  iFirst = 0;
  SColVal *pFirstVal = tsdbRowIterNext(&iter);
  while (pFirstVal && iFirst < nCol) {
    SLastUpdateCtx ctx = {.lflag = LFLAG_LAST_ROW, .tsdbRowKey = firstRowKey, .colVal = *pFirstVal};
    if (!taosArrayPush(ctxArray, &ctx)) {
      TAOS_CHECK_EXIT(terrno);
    }

    if (COL_VAL_IS_VALUE(pFirstVal)) {
      ctx.lflag = LFLAG_LAST;
      if (!taosArrayPush(ctxArray, &ctx)) {
        TAOS_CHECK_EXIT(terrno);
      }
    } else {
      // no value here: remember the column so later rows can supply one
      if (!pendingCols) {
        pendingCols = tSimpleHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT));
        if (pendingCols == NULL) {
          TAOS_CHECK_EXIT(terrno);
        }
      }

      if (tSimpleHashPut(pendingCols, &pFirstVal->cid, sizeof(pFirstVal->cid), &pFirstVal->cid,
                         sizeof(pFirstVal->cid))) {
        TAOS_CHECK_EXIT(terrno);
      }
    }

    pFirstVal = tsdbRowIterNext(&iter);
    iFirst++;
  }
  tsdbRowClose(&iter);

  // following rows: fill in last values for the pending columns
  for (pMemRow = tsdbImemGetNextRow(&tbIter, pSkyline, &iSkyline);
       pMemRow && tSimpleHashGetSize(pendingCols) != 0;
       pMemRow = tsdbImemGetNextRow(&tbIter, pSkyline, &iSkyline)) {
    TAOS_CHECK_EXIT(tsdbUpdateSkm(pTsdb, suid, uid, TSDBROW_SVERSION(pMemRow)));
    pTSchema = pTsdb->rCache.pTSchema;

    STsdbRowKey rowKey = {0};
    tsdbRowGetKey(pMemRow, &rowKey);

    TAOS_CHECK_EXIT(tsdbRowIterOpen(&iter, pMemRow, pTSchema));

    int32_t  iNext = 0;
    SColVal *pVal = tsdbRowIterNext(&iter);
    while (pVal && iNext < nCol) {
      if (tSimpleHashGet(pendingCols, &pVal->cid, sizeof(pVal->cid)) && COL_VAL_IS_VALUE(pVal)) {
        SLastUpdateCtx ctx = {.lflag = LFLAG_LAST, .tsdbRowKey = rowKey, .colVal = *pVal};
        if (!taosArrayPush(ctxArray, &ctx)) {
          TAOS_CHECK_EXIT(terrno);
        }

        TAOS_CHECK_EXIT(tSimpleHashRemove(pendingCols, &pVal->cid, sizeof(pVal->cid)));
      }

      pVal = tsdbRowIterNext(&iter);
      iNext++;
    }
    tsdbRowClose(&iter);
  }

  TAOS_CHECK_GOTO(tsdbCacheUpdate(pTsdb, suid, uid, ctxArray), &lino, _exit);

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));

    tsdbRowClose(&iter);
  }

  taosArrayClear(ctxArray);
  // destroy any allocated resource
  tSimpleHashCleanup(pendingCols);
  if (pMemDelData) {
    taosArrayDestroy(pMemDelData);
  }
  if (pSkyline) {
    taosArrayDestroy(pSkyline);
  }

  TAOS_RETURN(code);
}
749

750
/*
 * Push the content of the immutable memtable into the cache by running
 * tsdbLoadFromImem() over it via tsdbMemTableSaveToCache().
 *
 * Returns 0 without doing anything when there is no tsdb, no imem, or the
 * imem holds no rows or no table data. The outcome is logged otherwise.
 */
static int32_t tsdbCacheUpdateFromIMem(STsdb *pTsdb) {
  if (pTsdb == NULL || pTsdb->imem == NULL) {
    return 0;
  }

  int32_t    code = 0;
  int32_t    lino = 0;
  SMemTable *pMem = pTsdb->imem;
  int32_t    nTables = pMem->nTbData;
  int64_t    nRows = pMem->nRow;
  int64_t    nDels = pMem->nDel;

  if (nRows == 0 || nTables == 0) {
    return 0;
  }

  TAOS_CHECK_EXIT(tsdbMemTableSaveToCache(pMem, tsdbLoadFromImem));

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));
  } else {
    tsdbInfo("vgId:%d %s done, nRow:%" PRId64 " nDel:%" PRId64, TD_VID(pTsdb->pVnode), __func__, nRows, nDels);
  }

  TAOS_RETURN(code);
}
774

775
/*
 * Commit the cache.
 *
 * When tsUpdateCacheBatch is set, the cache is first refreshed from the
 * immutable memtable; a failure there is logged and returned. Then, holding
 * lruMutex, every dirty LRU entry is handed to tsdbCacheFlushDirty() and
 * (with USE_ROCKSDB) the pending write batch is written and rocksdb flushed.
 *
 * Returns 0 on success, the refresh error, or TSDB_CODE_FAILED when the
 * rocksdb flush reports an error.
 */
int32_t tsdbCacheCommit(STsdb *pTsdb) {
  int32_t code = 0;

  if (tsUpdateCacheBatch) {
    code = tsdbCacheUpdateFromIMem(pTsdb);
    if (code) {
      tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));

      TAOS_RETURN(code);
    }
  }

  char      *err = NULL;
  SLRUCache *pLru = pTsdb->lruCache;

  // flush dirty data of lru into rocks while holding the lru lock
  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  taosLRUCacheApply(pLru, tsdbCacheFlushDirty, pTsdb);

#ifdef USE_ROCKSDB
  rocksMayWrite(pTsdb, true);
  rocksdb_flush(pTsdb->rCache.db, pTsdb->rCache.flushoptions, &err);
#endif

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

#ifdef USE_ROCKSDB
  // the flush result is reported after the lock has been dropped
  if (NULL != err) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, err);
    rocksdb_free(err);
    code = TSDB_CODE_FAILED;
  }
#endif

  TAOS_RETURN(code);
}
814

815
/*
 * Give a variable-length SValue its own copy of the data it points to.
 *
 * For variable-length types with nData > 0, pData is replaced by a freshly
 * allocated copy; with nData == 0, pData is set to NULL. Other types are
 * left untouched. The previous buffer is not freed.
 *
 * Returns TSDB_CODE_SUCCESS, or terrno when the allocation fails (pData is
 * unchanged in that case).
 */
static int32_t reallocVarDataVal(SValue *pValue) {
  if (!IS_VAR_DATA_TYPE(pValue->type)) {
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  uint8_t *pSrc = pValue->pData;
  uint32_t nBytes = pValue->nData;

  if (nBytes == 0) {
    pValue->pData = NULL;
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  uint8_t *pCopy = taosMemoryMalloc(nBytes);
  if (!pCopy) {
    TAOS_RETURN(terrno);
  }

  (void)memcpy(pCopy, pSrc, nBytes);
  pValue->pData = pCopy;

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
833

834
/* Same as reallocVarDataVal(), applied to the value held by a column value. */
static int32_t reallocVarData(SColVal *pColVal) {
  SValue *pValue = &pColVal->value;
  return reallocVarDataVal(pValue);
}
×
835

836
// realloc pk data and col data.
837
/*
 * Turn `pCol` into a self-contained entry by duplicating every buffer it
 * points to: variable-length primary-key data, variable-length column data
 * and DECIMAL column data.
 *
 * @param pCol     entry to fix up in place
 * @param pCharge  optional; receives sizeof(SLastCol) plus the byte count of
 *                 all variable-length and DECIMAL data
 * @return TSDB_CODE_SUCCESS, or the allocation error. On failure the
 *         primary-key copies made so far are freed and *pCol is zeroed.
 */
static int32_t tsdbCacheReallocSLastCol(SLastCol *pCol, size_t *pCharge) {
  int32_t code = TSDB_CODE_SUCCESS, lino = 0;
  size_t  total = sizeof(SLastCol);

  // number of primary keys visited so far; used by the failure path below
  int8_t nDone = 0;
  while (nDone < pCol->rowKey.numOfPKs) {
    SValue *pPk = &pCol->rowKey.pks[nDone];
    if (IS_VAR_DATA_TYPE(pPk->type)) {
      TAOS_CHECK_EXIT(reallocVarDataVal(pPk));
      total += pPk->nData;
    }
    nDone++;
  }

  if (IS_VAR_DATA_TYPE(pCol->colVal.value.type)) {
    TAOS_CHECK_EXIT(reallocVarData(&pCol->colVal));
    total += pCol->colVal.value.nData;
  }

  if (pCol->colVal.value.type == TSDB_DATA_TYPE_DECIMAL) {
    if (pCol->colVal.value.nData > 0) {
      void *pCopy = taosMemoryMalloc(pCol->colVal.value.nData);
      if (!pCopy) TAOS_CHECK_EXIT(terrno);
      (void)memcpy(pCopy, pCol->colVal.value.pData, pCol->colVal.value.nData);
      pCol->colVal.value.pData = pCopy;
    } else {
      pCol->colVal.value.pData = NULL;
    }
    total += pCol->colVal.value.nData;
  }

  if (pCharge) {
    *pCharge = total;
  }

_exit:
  if (TSDB_CODE_SUCCESS != code) {
    for (int8_t k = 0; k < nDone; k++) {
      if (IS_VAR_DATA_TYPE(pCol->rowKey.pks[k].type)) {
        taosMemoryFree(pCol->rowKey.pks[k].pData);
      }
    }

    (void)memset(pCol, 0, sizeof(SLastCol));
  }

  TAOS_RETURN(code);
}
884

885
void tsdbCacheFreeSLastColItem(void *pItem) {
×
886
  SLastCol *pCol = (SLastCol *)pItem;
×
887
  for (int i = 0; i < pCol->rowKey.numOfPKs; i++) {
×
888
    if (IS_VAR_DATA_TYPE(pCol->rowKey.pks[i].type)) {
×
889
      taosMemoryFree(pCol->rowKey.pks[i].pData);
×
890
    }
891
  }
892

893
  if ((IS_VAR_DATA_TYPE(pCol->colVal.value.type) || pCol->colVal.value.type == TSDB_DATA_TYPE_DECIMAL) &&
×
894
      pCol->colVal.value.pData) {
×
895
    taosMemoryFree(pCol->colVal.value.pData);
×
896
  }
897
}
×
898

899
static void tsdbCacheDeleter(const void *key, size_t klen, void *value, void *ud) {
×
900
  SLastCol *pLastCol = (SLastCol *)value;
×
901

902
  if (pLastCol->dirty) {
×
903
    if (tsdbCacheFlushDirty(key, klen, pLastCol, ud) != 0) {
×
904
      STsdb *pTsdb = (STsdb *)ud;
×
905
      tsdbTrace("tsdb/cache: vgId:%d, flush cache %s failed at line %d.", TD_VID(pTsdb->pVnode), __func__, __LINE__);
×
906
    }
907
  }
908

909
  for (uint8_t i = 0; i < pLastCol->rowKey.numOfPKs; ++i) {
×
910
    SValue *pValue = &pLastCol->rowKey.pks[i];
×
911
    if (IS_VAR_DATA_TYPE(pValue->type)) {
×
912
      taosMemoryFree(pValue->pData);
×
913
    }
914
  }
915

916
  if (IS_VAR_DATA_TYPE(pLastCol->colVal.value.type) ||
×
917
      pLastCol->colVal.value.type == TSDB_DATA_TYPE_DECIMAL /* && pLastCol->colVal.value.nData > 0*/) {
×
918
    taosMemoryFree(pLastCol->colVal.value.pData);
×
919
  }
920

921
  taosMemoryFree(value);
×
922
}
×
923

924
static void tsdbCacheOverWriter(const void *key, size_t klen, void *value, void *ud) {
×
925
  SLastCol *pLastCol = (SLastCol *)value;
×
926
  pLastCol->dirty = 0;
×
927
}
×
928

929
// Forward declaration: the definition appears later in this file, but
// tsdbCacheNewTableColumn below already calls it.
static int32_t tsdbCachePutToLRU(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol, int8_t dirty);
930

931
/*
 * Seed the LRU cache with a placeholder entry for one (uid, cid, lflag) key.
 *
 * The placeholder has ts == TSKEY_MIN, no primary keys, a NONE value of type
 * col_type, status TSDB_LAST_CACHE_VALID, and is inserted dirty.
 *
 * Returns the result of tsdbCachePutToLRU; a failure is also logged.
 */
static int32_t tsdbCacheNewTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, int8_t col_type, int8_t lflag) {
  SRowKey  noKey = {.ts = TSKEY_MIN, .numOfPKs = 0};
  SLastCol placeholder = {
      .rowKey = noKey, .colVal = COL_VAL_NONE(cid, col_type), .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
  SLastKey lastKey = {.lflag = lflag, .uid = uid, .cid = cid};

  int32_t code = tsdbCachePutToLRU(pTsdb, &lastKey, &placeholder, 1);
  if (code) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
  }

  TAOS_RETURN(code);
}
948

949
/*
 * Flush the cache without taking any lock itself: tsdbCacheFlushDirty is
 * applied to every LRU entry and, when built with USE_ROCKSDB, the pending
 * write batch is written and RocksDB is flushed.
 *
 * Returns 0, or TSDB_CODE_FAILED when rocksdb_flush reports an error.
 */
int32_t tsdbCacheCommitNoLock(STsdb *pTsdb) {
  int32_t code = 0;
  char   *flushErr = NULL;

  taosLRUCacheApply(pTsdb->lruCache, tsdbCacheFlushDirty, pTsdb);

#ifdef USE_ROCKSDB
  rocksMayWrite(pTsdb, true);
  rocksdb_flush(pTsdb->rCache.db, pTsdb->rCache.flushoptions, &flushErr);
  if (flushErr != NULL) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, flushErr);
    rocksdb_free(flushErr);
    code = TSDB_CODE_FAILED;
  }
#endif

  TAOS_RETURN(code);
}
968

969
/*
 * Batch-read numKeys values from RocksDB.
 *
 * ppKeysList / pKeysListSizes   keys and their lengths
 * pppValuesList                 out: array of numKeys value buffers
 * ppValuesListSizes             out: array of numKeys value lengths
 *
 * Both output arrays are allocated here and handed to the caller. Per-key
 * error strings returned by rocksdb_multi_get are freed without being
 * inspected. Without USE_ROCKSDB the outputs are left untouched and success
 * is returned.
 *
 * Returns terrno when one of the bookkeeping arrays cannot be allocated.
 */
static int32_t tsdbCacheGetValuesFromRocks(STsdb *pTsdb, size_t numKeys, const char *const *ppKeysList,
                                           size_t *pKeysListSizes, char ***pppValuesList, size_t **ppValuesListSizes) {
#ifdef USE_ROCKSDB
  char **ppVals = taosMemoryCalloc(numKeys, sizeof(char *));
  if (ppVals == NULL) {
    return terrno;
  }

  size_t *pValSizes = taosMemoryCalloc(numKeys, sizeof(size_t));
  if (pValSizes == NULL) {
    taosMemoryFreeClear(ppVals);
    return terrno;
  }

  char **ppErrs = taosMemoryCalloc(numKeys, sizeof(char *));
  if (ppErrs == NULL) {
    taosMemoryFreeClear(ppVals);
    taosMemoryFreeClear(pValSizes);
    return terrno;
  }

  rocksdb_multi_get(pTsdb->rCache.db, pTsdb->rCache.readoptions, numKeys, ppKeysList, pKeysListSizes, ppVals,
                    pValSizes, ppErrs);

  size_t iKey = 0;
  while (iKey < numKeys) {
    rocksdb_free(ppErrs[iKey]);
    ++iKey;
  }
  taosMemoryFreeClear(ppErrs);

  *pppValuesList = ppVals;
  *ppValuesListSizes = pValSizes;
#endif
  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
997

998
/*
 * Remove the LAST and LAST_ROW cache entries of one column of one table from
 * both RocksDB (through the pending write batch) and the LRU cache.
 *
 * pTsdb          tsdb instance owning the caches
 * uid, cid       table uid and column id that form the cache keys
 * hasPrimaryKey  currently unused by this function
 *
 * The caller is expected to have flushed the write batch already (see the
 * note before the RocksDB read).
 *
 * Returns 0 on success, terrno on allocation failure, or the error from
 * tsdbCacheGetValuesFromRocks / tsdbCacheDeserialize.
 */
static int32_t tsdbCacheDropTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, bool hasPrimaryKey) {
  int32_t code = 0;
  char  **values_list = NULL;
  size_t *values_list_sizes = NULL;

  // build keys & multi get from rocks
  char **keys_list = taosMemoryCalloc(2, sizeof(char *));
  if (!keys_list) {
    return terrno;
  }
  size_t *keys_list_sizes = taosMemoryCalloc(2, sizeof(size_t));
  if (!keys_list_sizes) {
    taosMemoryFree(keys_list);
    return terrno;
  }
  const size_t klen = ROCKS_KEY_LEN;

  // one allocation holds both keys; keys_list[0] aliases its start
  char *keys = taosMemoryCalloc(2, sizeof(SLastKey));
  if (!keys) {
    taosMemoryFree(keys_list);
    taosMemoryFree(keys_list_sizes);
    return terrno;
  }
  ((SLastKey *)keys)[0] = (SLastKey){.lflag = LFLAG_LAST, .uid = uid, .cid = cid};
  ((SLastKey *)keys)[1] = (SLastKey){.lflag = LFLAG_LAST_ROW, .uid = uid, .cid = cid};

  keys_list[0] = keys;
  keys_list[1] = keys + sizeof(SLastKey);
  keys_list_sizes[0] = klen;
  keys_list_sizes[1] = klen;

  // the write batch was already flushed by the caller, so no rocksMayWrite here
  TAOS_CHECK_GOTO(tsdbCacheGetValuesFromRocks(pTsdb, 2, (const char *const *)keys_list, keys_list_sizes, &values_list,
                                              &values_list_sizes),
                  NULL, _exit);

#ifdef USE_ROCKSDB
  {
    rocksdb_writebatch_t *wb = pTsdb->rCache.writebatch;

    // queue a delete for every key that has a decodable value in RocksDB
    for (int i = 0; i < 2; i++) {
      if (values_list[i] == NULL) {
        continue;
      }

      SLastCol *pLastCol = NULL;
      code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
        goto _exit;
      }
      if (NULL != pLastCol) {
        rocksdb_writebatch_delete(wb, keys_list[i], klen);
      }
      taosMemoryFreeClear(pLastCol);
    }
  }
#endif

  // drop the entries from the LRU cache as well
  for (int i = 0; i < 2; i++) {
    LRUHandle *h = taosLRUCacheLookup(pTsdb->lruCache, keys_list[i], klen);
    if (h) {
      tsdbLRUCacheRelease(pTsdb->lruCache, h, true);
      taosLRUCacheErase(pTsdb->lruCache, keys_list[i], klen);
    }
  }

_exit:
#ifdef USE_ROCKSDB
  // The value buffers come from RocksDB. Releasing them here rather than on
  // the success path only keeps them from leaking when deserialization fails.
  if (values_list) {
    rocksdb_free(values_list[0]);
    rocksdb_free(values_list[1]);
  }
#endif
  taosMemoryFree(keys);

  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  taosMemoryFree(values_list);
  taosMemoryFree(values_list_sizes);

  TAOS_RETURN(code);
}
1092

1093
/*
 * Create placeholder LAST_ROW and LAST cache entries for every column of a
 * newly created table, under lruMutex.
 *
 * When suid < 0 the columns are taken from pSchemaRow; otherwise the schema
 * is fetched with metaGetTbTSchemaEx(suid, uid, -1) and freed before
 * returning.
 *
 * Per-column failures are only traced. The returned code is the schema lookup
 * error, or else the result of the last tsdbCacheNewTableColumn call.
 */
int32_t tsdbCacheNewTable(STsdb *pTsdb, tb_uid_t uid, tb_uid_t suid, const SSchemaWrapper *pSchemaRow) {
  int32_t    code = 0;
  const bool fromWrapper = (suid < 0);
  STSchema  *pTSchema = NULL;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  if (!fromWrapper) {
    code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, -1, &pTSchema);
    if (code != TSDB_CODE_SUCCESS) {
      (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

      TAOS_RETURN(code);
    }
  }

  const int    nCols = fromWrapper ? pSchemaRow->nCols : pTSchema->numOfCols;
  const int8_t lflags[2] = {LFLAG_LAST_ROW, LFLAG_LAST};

  for (int iCol = 0; iCol < nCols; ++iCol) {
    int16_t cid;
    int8_t  col_type;
    if (fromWrapper) {
      cid = pSchemaRow->pSchema[iCol].colId;
      col_type = pSchemaRow->pSchema[iCol].type;
    } else {
      cid = pTSchema->columns[iCol].colId;
      col_type = pTSchema->columns[iCol].type;
    }

    // LAST_ROW entry first, then LAST
    for (int k = 0; k < 2; ++k) {
      code = tsdbCacheNewTableColumn(pTsdb, uid, cid, col_type, lflags[k]);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbTrace("vgId:%d, %s new table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
      }
    }
  }

  if (!fromWrapper) {
    taosMemoryFree(pTSchema);
  }

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1146

1147
/*
 * Drop every cached column of a table, under lruMutex.
 *
 * The cache is committed first (a failure is only traced). Columns come from
 * pSchemaRow when it is non-NULL, otherwise from the schema fetched with
 * metaGetTbTSchemaEx(suid, uid, -1). The second column's COL_IS_KEY flag
 * decides the hasPrimaryKey argument passed to tsdbCacheDropTableColumn.
 *
 * Returns the schema lookup error, or else the result of the last
 * tsdbCacheDropTableColumn call (per-column failures are only traced).
 */
int32_t tsdbCacheDropTable(STsdb *pTsdb, tb_uid_t uid, tb_uid_t suid, SSchemaWrapper *pSchemaRow) {
  int32_t    code = 0;
  const bool fromWrapper = (pSchemaRow != NULL);
  STSchema  *pTSchema = NULL;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  code = tsdbCacheCommitNoLock(pTsdb);
  if (code != TSDB_CODE_SUCCESS) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  if (!fromWrapper) {
    code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, -1, &pTSchema);
    if (code != TSDB_CODE_SUCCESS) {
      (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

      TAOS_RETURN(code);
    }
  }

  const int nCols = fromWrapper ? pSchemaRow->nCols : pTSchema->numOfCols;

  bool hasPrimayKey = false;
  if (nCols >= 2) {
    hasPrimayKey = fromWrapper ? ((pSchemaRow->pSchema[1].flags & COL_IS_KEY) ? true : false)
                               : ((pTSchema->columns[1].flags & COL_IS_KEY) ? true : false);
  }

  for (int iCol = 0; iCol < nCols; ++iCol) {
    int16_t cid = fromWrapper ? pSchemaRow->pSchema[iCol].colId : pTSchema->columns[iCol].colId;

    code = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
    if (code != TSDB_CODE_SUCCESS) {
      tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(code));
    }
  }

  if (!fromWrapper) {
    taosMemoryFree(pTSchema);
  }

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1208

1209
/*
 * Drop every cached column of each child table listed in `uids`, under
 * lruMutex.
 *
 * pTsdb  tsdb instance owning the caches
 * uids   array of tb_uid_t child-table uids
 * suid   super-table uid; its schema (metaGetTbTSchemaEx(suid, suid, -1))
 *        supplies the column list used for every child
 *
 * The cache is committed first (a failure is only traced). Per-column drop
 * failures are traced and do not stop the loop.
 *
 * Returns the schema lookup error, or else the result of the last
 * tsdbCacheDropTableColumn call (0 when `uids` is empty or has no columns).
 */
int32_t tsdbCacheDropSubTables(STsdb *pTsdb, SArray *uids, tb_uid_t suid) {
  int32_t code = 0;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  code = tsdbCacheCommitNoLock(pTsdb);
  if (code != TSDB_CODE_SUCCESS) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  STSchema *pTSchema = NULL;
  code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, suid, -1, &pTSchema);
  if (code != TSDB_CODE_SUCCESS) {
    (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

    TAOS_RETURN(code);
  }

  // The schema is shared by all children, so the column count and the
  // primary-key probe are computed once instead of once per uid.
  const int nCols = pTSchema->numOfCols;
  bool      hasPrimayKey = false;
  if (nCols >= 2) {
    hasPrimayKey = (pTSchema->columns[1].flags & COL_IS_KEY) ? true : false;
  }

  for (int iUid = 0; iUid < TARRAY_SIZE(uids); ++iUid) {
    int64_t uid = ((tb_uid_t *)TARRAY_DATA(uids))[iUid];

    // distinct index name: the original inner loop shadowed the outer `i`
    for (int iCol = 0; iCol < nCols; ++iCol) {
      int16_t cid = pTSchema->columns[iCol].colId;

      code = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
      }
    }
  }

  taosMemoryFree(pTSchema);

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1257

1258
/*
 * Create the two placeholder cache entries (lflag 0, then lflag 1) for a
 * column added to a table, under lruMutex.
 *
 * Failures are only traced; the returned code is that of the second
 * tsdbCacheNewTableColumn call.
 */
int32_t tsdbCacheNewNTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, int8_t col_type) {
  int32_t      code = 0;
  const int8_t lflags[2] = {0, 1};

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  for (int k = 0; k < 2; ++k) {
    code = tsdbCacheNewTableColumn(pTsdb, uid, cid, col_type, lflags[k]);
    if (code != TSDB_CODE_SUCCESS) {
      tsdbTrace("vgId:%d, %s new table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(code));
    }
  }

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1278

1279
/*
 * Drop the cache entries of one column of one table, under lruMutex.
 *
 * The cache is committed first, then the column is dropped, then
 * rocksMayWrite(pTsdb, false) is called. Failures of the first two steps are
 * traced; the returned code is that of tsdbCacheDropTableColumn.
 */
int32_t tsdbCacheDropNTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, bool hasPrimayKey) {
  int32_t rc = 0;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  rc = tsdbCacheCommitNoLock(pTsdb);
  if (TSDB_CODE_SUCCESS != rc) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(rc));
  }

  rc = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
  if (TSDB_CODE_SUCCESS != rc) {
    tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(rc));
  }

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(rc);
}
1302

1303
/*
 * For every table uid in `uids`, create the two placeholder cache entries
 * (lflag 0, then lflag 1) for a newly added column, under lruMutex.
 *
 * Failures are only traced; the returned code is that of the last
 * tsdbCacheNewTableColumn call (0 when `uids` is empty).
 */
int32_t tsdbCacheNewSTableColumn(STsdb *pTsdb, SArray *uids, int16_t cid, int8_t col_type) {
  int32_t      code = 0;
  const int8_t lflags[2] = {0, 1};

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  for (int iUid = 0; iUid < TARRAY_SIZE(uids); ++iUid) {
    tb_uid_t uid = ((tb_uid_t *)TARRAY_DATA(uids))[iUid];

    for (int k = 0; k < 2; ++k) {
      code = tsdbCacheNewTableColumn(pTsdb, uid, cid, col_type, lflags[k]);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbTrace("vgId:%d, %s new table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
      }
    }
  }

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
  TAOS_RETURN(code);
}
1327

1328
/*
 * Drop the cache entries of column `cid` for every table uid in `uids`,
 * under lruMutex.
 *
 * The cache is committed first; afterwards rocksMayWrite(pTsdb, false) is
 * called. Failures are only traced; the returned code is that of the last
 * tsdbCacheDropTableColumn call, or of the commit when `uids` is empty.
 */
int32_t tsdbCacheDropSTableColumn(STsdb *pTsdb, SArray *uids, int16_t cid, bool hasPrimayKey) {
  int32_t rc = 0;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  rc = tsdbCacheCommitNoLock(pTsdb);
  if (TSDB_CODE_SUCCESS != rc) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(rc));
  }

  int iUid = 0;
  while (iUid < TARRAY_SIZE(uids)) {
    int64_t uid = ((tb_uid_t *)TARRAY_DATA(uids))[iUid];

    rc = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
    if (TSDB_CODE_SUCCESS != rc) {
      tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(rc));
    }
    ++iUid;
  }

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(rc);
}
1355

1356
// Pairs a cache key with a position in a caller-side array; used for keys
// that missed the LRU cache and still have to be looked up in RocksDB.
typedef struct {
1357
  int      idx;  // tsdbCacheUpdate stores the index into its updCtxArray here
1358
  SLastKey key;  // cache key (lflag, uid, cid)
1359
} SIdxKey;
1360

1361
/*
 * Reset a cached column entry to "no value".
 *
 * The row key becomes ts == TSKEY_MIN with zero primary keys, the value
 * becomes COL_VAL_NONE (same cid and type), the entry is marked dirty and its
 * cacheStatus is set to the given status. Non-empty variable-length payloads
 * are freed; everything else is cleared through valueClearDatum.
 */
static void tsdbCacheUpdateLastColToNone(SLastCol *pLastCol, ELastCacheStatus cacheStatus) {
  SRowKey *pKey = &pLastCol->rowKey;
  SValue  *pVal = &pLastCol->colVal.value;

  // row key
  pKey->ts = TSKEY_MIN;
  for (int8_t iPk = 0; iPk < pKey->numOfPKs; iPk++) {
    SValue *pPk = &pKey->pks[iPk];
    if (!(IS_VAR_DATA_TYPE(pPk->type) && pPk->nData > 0)) {
      valueClearDatum(pPk, pPk->type);
      continue;
    }
    taosMemoryFreeClear(pPk->pData);
    pPk->nData = 0;
  }
  pKey->numOfPKs = 0;

  // column value
  if (!(IS_VAR_DATA_TYPE(pVal->type) && pVal->nData > 0)) {
    valueClearDatum(pVal, pVal->type);
  } else {
    taosMemoryFreeClear(pVal->pData);
    pVal->nData = 0;
  }

  pLastCol->colVal = COL_VAL_NONE(pLastCol->colVal.cid, pLastCol->colVal.value.type);
  pLastCol->dirty = 1;
  pLastCol->cacheStatus = cacheStatus;
}
×
1387

1388
/*
 * Serialize pLastCol and queue it under pLastKey in the RocksDB write batch.
 *
 * The put is performed while holding rCache.writeBatchMutex; the serialized
 * buffer is freed afterwards. Without USE_ROCKSDB this is a no-op returning 0.
 *
 * Returns 0 or the error from tsdbCacheSerialize (which is also logged).
 */
static int32_t tsdbCachePutToRocksdb(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol) {
  int32_t code = 0;
#ifdef USE_ROCKSDB
  size_t nEncoded = 0;
  char  *pEncoded = NULL;

  code = tsdbCacheSerialize(pLastCol, &pEncoded, &nEncoded);
  if (code) {
    tsdbError("tsdb/cache/putrocks: vgId:%d, serialize failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
    TAOS_RETURN(code);
  }

  rocksdb_writebatch_t *pBatch = pTsdb->rCache.writebatch;

  (void)taosThreadMutexLock(&pTsdb->rCache.writeBatchMutex);
  rocksdb_writebatch_put(pBatch, (char *)pLastKey, ROCKS_KEY_LEN, pEncoded, nEncoded);
  (void)taosThreadMutexUnlock(&pTsdb->rCache.writeBatchMutex);

  taosMemoryFree(pEncoded);
#endif
  TAOS_RETURN(code);
}
1409

1410
/*
 * Insert a heap copy of *pLastCol into the LRU cache under pLastKey.
 *
 * The copy gets the requested dirty flag and its own payload copies (see
 * tsdbCacheReallocSLastCol), whose byte count is used as the cache charge.
 * tsdbCacheDeleter / tsdbCacheOverWriter are registered as callbacks with
 * pTsdb as user data.
 *
 * Returns 0, terrno if the copy cannot be allocated, the error from
 * tsdbCacheReallocSLastCol, or TSDB_CODE_FAILED when the insert status is
 * neither OK nor OK_OVERWRITTEN.
 */
static int32_t tsdbCachePutToLRU(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol, int8_t dirty) {
  int32_t   code = 0, lino = 0;
  size_t    charge = 0;
  LRUStatus status;

  SLastCol *pEntry = taosMemoryCalloc(1, sizeof(SLastCol));
  if (pEntry == NULL) {
    return terrno;
  }

  *pEntry = *pLastCol;
  pEntry->dirty = dirty;
  TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(pEntry, &charge));

  status = taosLRUCacheInsert(pTsdb->lruCache, pLastKey, ROCKS_KEY_LEN, pEntry, charge, tsdbCacheDeleter,
                              tsdbCacheOverWriter, NULL, TAOS_LRU_PRIORITY_LOW, pTsdb);
  if (!(TAOS_LRU_STATUS_OK == status || TAOS_LRU_STATUS_OK_OVERWRITTEN == status)) {
    tsdbError("vgId:%d, %s failed at line %d status %d.", TD_VID(pTsdb->pVnode), __func__, __LINE__, status);
    code = TSDB_CODE_FAILED;
    // the entry is not freed below on this path
    pEntry = NULL;
  }

_exit:
  if (code != TSDB_CODE_SUCCESS) {
    taosMemoryFree(pEntry);
    tsdbError("tsdb/cache/putlru: vgId:%d, failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));
  }

  TAOS_RETURN(code);
}
1439

1440
/*
 * Apply a batch of last / last_row updates for table `uid` to the cache.
 *
 * pTsdb        tsdb instance owning the LRU cache and the RocksDB cache
 * suid         not used by this function
 * uid          table uid the updates belong to
 * updCtxArray  array of SLastUpdateCtx; NULL or empty is a successful no-op
 *
 * Phase 1 (LRU hits): an entry is replaced when the incoming row key is newer,
 * or equal with a non-NONE value, unless the cached entry is marked
 * TSDB_LAST_CACHE_NO_CACHE. Misses are collected in `remainCols`.
 * Phase 2 (misses): the keys are read from RocksDB in one batch and each
 * update is written to RocksDB and to the LRU when it wins the same
 * comparison (or nothing was stored).
 *
 * The whole operation runs under lruMutex. All scratch arrays are released at
 * _exit so that no error path leaks them.
 *
 * Returns 0 on success, otherwise the first error encountered.
 */
static int32_t tsdbCacheUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, SArray *updCtxArray) {
  if (!updCtxArray || TARRAY_SIZE(updCtxArray) == 0) {
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  int32_t code = 0, lino = 0;

  int        num_keys = TARRAY_SIZE(updCtxArray);
  SArray    *remainCols = NULL;
  SLRUCache *pCache = pTsdb->lruCache;

  // Scratch arrays of phase 2. They live at function scope and are freed at
  // _exit, so early exits cannot leak them.
  char  **keys_list = NULL;
  size_t *keys_list_sizes = NULL;
  char  **values_list = NULL;
  size_t *values_list_sizes = NULL;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);
  for (int i = 0; i < num_keys; ++i) {
    SLastUpdateCtx *updCtx = &((SLastUpdateCtx *)TARRAY_DATA(updCtxArray))[i];
    int8_t          lflag = updCtx->lflag;
    SRowKey        *pRowKey = &updCtx->tsdbRowKey.key;
    SColVal        *pColVal = &updCtx->colVal;

    // "last" only tracks real values
    if (lflag == LFLAG_LAST && !COL_VAL_IS_VALUE(pColVal)) {
      continue;
    }

    SLastKey  *key = &(SLastKey){.lflag = lflag, .uid = uid, .cid = pColVal->cid};
    LRUHandle *h = taosLRUCacheLookup(pCache, key, ROCKS_KEY_LEN);
    if (h) {
      SLastCol *pLastCol = (SLastCol *)taosLRUCacheValue(pCache, h);
      if (pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
        int32_t cmp_res = tRowKeyCompare(&pLastCol->rowKey, pRowKey);
        if (cmp_res < 0 || (cmp_res == 0 && !COL_VAL_IS_NONE(pColVal))) {
          SLastCol newLastCol = {
              .rowKey = *pRowKey, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
          code = tsdbCachePutToLRU(pTsdb, key, &newLastCol, 1);
        }
      }

      tsdbLRUCacheRelease(pCache, h, false);
      TAOS_CHECK_EXIT(code);
    } else {
      // LRU miss: remember the key and the index of its update context
      if (!remainCols) {
        remainCols = taosArrayInit(num_keys * 2, sizeof(SIdxKey));
        if (!remainCols) {
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
        }
      }
      if (!taosArrayPush(remainCols, &(SIdxKey){i, *key})) {
        TAOS_CHECK_GOTO(terrno, &lino, _exit);
      }
    }
  }

  if (remainCols) {
    num_keys = TARRAY_SIZE(remainCols);
  }
  if (remainCols && num_keys > 0) {
    keys_list = taosMemoryCalloc(num_keys, sizeof(char *));
    if (!keys_list) {
      // go through _exit so remainCols is destroyed and the mutex released
      code = terrno;
      lino = __LINE__;
      goto _exit;
    }
    keys_list_sizes = taosMemoryCalloc(num_keys, sizeof(size_t));
    if (!keys_list_sizes) {
      code = terrno;
      lino = __LINE__;
      goto _exit;
    }
    for (int i = 0; i < num_keys; ++i) {
      SIdxKey *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[i];

      keys_list[i] = (char *)&idxKey->key;
      keys_list_sizes[i] = ROCKS_KEY_LEN;
    }

    rocksMayWrite(pTsdb, true);  // flush writebatch cache

    code = tsdbCacheGetValuesFromRocks(pTsdb, num_keys, (const char *const *)keys_list, keys_list_sizes, &values_list,
                                       &values_list_sizes);
    if (code) {
      goto _exit;
    }

    for (int i = 0; i < num_keys; ++i) {
      SIdxKey        *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[i];
      SLastUpdateCtx *updCtx = (SLastUpdateCtx *)taosArrayGet(updCtxArray, idxKey->idx);
      SRowKey        *pRowKey = &updCtx->tsdbRowKey.key;
      SColVal        *pColVal = &updCtx->colVal;

      SLastCol *pLastCol = NULL;
      if (values_list[i] != NULL) {
        code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
        if (code != TSDB_CODE_SUCCESS) {
          tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                    tstrerror(code));
          goto _exit;
        }
      }
      SLastCol *pToFree = pLastCol;

      if (pLastCol && pLastCol->cacheStatus == TSDB_LAST_CACHE_NO_CACHE) {
        if ((code = tsdbCachePutToLRU(pTsdb, &idxKey->key, pLastCol, 0)) != TSDB_CODE_SUCCESS) {
          tsdbError("tsdb/cache: vgId:%d, put lru failed at line %d since %s.", TD_VID(pTsdb->pVnode), __LINE__,
                    tstrerror(code));
          taosMemoryFreeClear(pToFree);
          break;
        }

        // cache invalid => skip update
        taosMemoryFreeClear(pToFree);
        continue;
      }

      if (IS_LAST_KEY(idxKey->key) && !COL_VAL_IS_VALUE(pColVal)) {
        taosMemoryFreeClear(pToFree);
        continue;
      }

      int32_t cmp_res = 1;
      if (pLastCol) {
        cmp_res = tRowKeyCompare(&pLastCol->rowKey, pRowKey);
      }

      if (NULL == pLastCol || cmp_res < 0 || (cmp_res == 0 && !COL_VAL_IS_NONE(pColVal))) {
        SLastCol lastColTmp = {
            .rowKey = *pRowKey, .colVal = *pColVal, .dirty = 0, .cacheStatus = TSDB_LAST_CACHE_VALID};
        if ((code = tsdbCachePutToRocksdb(pTsdb, &idxKey->key, &lastColTmp)) != TSDB_CODE_SUCCESS) {
          tsdbError("tsdb/cache: vgId:%d, put rocks failed at line %d since %s.", TD_VID(pTsdb->pVnode), __LINE__,
                    tstrerror(code));
          taosMemoryFreeClear(pToFree);
          break;
        }
        if ((code = tsdbCachePutToLRU(pTsdb, &idxKey->key, &lastColTmp, 0)) != TSDB_CODE_SUCCESS) {
          tsdbError("tsdb/cache: vgId:%d, put lru failed at line %d since %s.", TD_VID(pTsdb->pVnode), __LINE__,
                    tstrerror(code));
          taosMemoryFreeClear(pToFree);
          break;
        }
      }

      taosMemoryFreeClear(pToFree);
    }

    rocksMayWrite(pTsdb, false);
  }

_exit:
  // values_list is only non-NULL after num_keys was set to the number of
  // missed keys, so num_keys is the right bound here
  if (values_list) {
#ifdef USE_ROCKSDB
    for (int i = 0; i < num_keys; ++i) {
      rocksdb_free(values_list[i]);
    }
#endif
    taosMemoryFree(values_list);
  }
  taosMemoryFree(values_list_sizes);
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
  taosArrayDestroy(remainCols);

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, update failed at line %d since %s.", TD_VID(pTsdb->pVnode), __LINE__,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
1619

1620
int32_t tsdbCacheRowFormatUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, int64_t version, int32_t nRow,
×
1621
                                 SRow **aRow) {
1622
  int32_t code = 0, lino = 0;
×
1623

1624
  // 1. prepare last
1625
  TSDBROW      lRow = {.type = TSDBROW_ROW_FMT, .pTSRow = aRow[nRow - 1], .version = version};
×
1626
  STSchema    *pTSchema = NULL;
×
1627
  int32_t      sver = TSDBROW_SVERSION(&lRow);
×
1628
  SSHashObj   *iColHash = NULL;
×
1629
  STSDBRowIter iter = {0};
×
1630

1631
  TAOS_CHECK_GOTO(tsdbUpdateSkm(pTsdb, suid, uid, sver), &lino, _exit);
×
1632
  pTSchema = pTsdb->rCache.pTSchema;
×
1633

1634
  TSDBROW tRow = {.type = TSDBROW_ROW_FMT, .version = version};
×
1635
  int32_t nCol = pTSchema->numOfCols;
×
1636
  SArray *ctxArray = pTsdb->rCache.ctxArray;
×
1637

1638
  // 1. prepare by lrow
1639
  STsdbRowKey tsdbRowKey = {0};
×
1640
  tsdbRowGetKey(&lRow, &tsdbRowKey);
×
1641

1642
  TAOS_CHECK_GOTO(tsdbRowIterOpen(&iter, &lRow, pTSchema), &lino, _exit);
×
1643

1644
  int32_t iCol = 0;
×
1645
  for (SColVal *pColVal = tsdbRowIterNext(&iter); pColVal && iCol < nCol; pColVal = tsdbRowIterNext(&iter), iCol++) {
×
1646
    SLastUpdateCtx updateCtx = {.lflag = LFLAG_LAST_ROW, .tsdbRowKey = tsdbRowKey, .colVal = *pColVal};
×
1647
    if (!taosArrayPush(ctxArray, &updateCtx)) {
×
1648
      TAOS_CHECK_GOTO(terrno, &lino, _exit);
×
1649
    }
1650

1651
    if (COL_VAL_IS_VALUE(pColVal)) {
×
1652
      updateCtx.lflag = LFLAG_LAST;
×
1653
      if (!taosArrayPush(ctxArray, &updateCtx)) {
×
1654
        TAOS_CHECK_GOTO(terrno, &lino, _exit);
×
1655
      }
1656
    } else {
1657
      if (!iColHash) {
×
1658
        iColHash = tSimpleHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT));
×
1659
        if (iColHash == NULL) {
×
1660
          TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _exit);
×
1661
        }
1662
      }
1663

1664
      if (tSimpleHashPut(iColHash, &iCol, sizeof(iCol), NULL, 0)) {
×
1665
        TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _exit);
×
1666
      }
1667
    }
1668
  }
1669

1670
  // 2. prepare by the other rows
1671
  for (int32_t iRow = nRow - 2; iRow >= 0; --iRow) {
×
1672
    if (tSimpleHashGetSize(iColHash) == 0) {
×
1673
      break;
×
1674
    }
1675

1676
    tRow.pTSRow = aRow[iRow];
×
1677

1678
    STsdbRowKey tsdbRowKey = {0};
×
1679
    tsdbRowGetKey(&tRow, &tsdbRowKey);
×
1680

1681
    void   *pIte = NULL;
×
1682
    int32_t iter = 0;
×
1683
    while ((pIte = tSimpleHashIterate(iColHash, pIte, &iter)) != NULL) {
×
1684
      int32_t iCol = ((int32_t *)pIte)[0];
×
1685
      SColVal colVal = COL_VAL_NONE(0, 0);
×
1686
      tsdbRowGetColVal(&tRow, pTSchema, iCol, &colVal);
×
1687

1688
      if (COL_VAL_IS_VALUE(&colVal)) {
×
1689
        SLastUpdateCtx updateCtx = {.lflag = LFLAG_LAST, .tsdbRowKey = tsdbRowKey, .colVal = colVal};
×
1690
        if (!taosArrayPush(ctxArray, &updateCtx)) {
×
1691
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
×
1692
        }
1693
        code = tSimpleHashIterateRemove(iColHash, &iCol, sizeof(iCol), &pIte, &iter);
×
1694
        if (code != TSDB_CODE_SUCCESS) {
×
1695
          tsdbTrace("vgId:%d, %s tSimpleHashIterateRemove failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__,
×
1696
                    __LINE__, tstrerror(code));
1697
        }
1698
      }
1699
    }
1700
  }
1701

1702
  TAOS_CHECK_GOTO(tsdbCacheUpdate(pTsdb, suid, uid, ctxArray), &lino, _exit);
×
1703

1704
_exit:
×
1705
  if (code) {
×
1706
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
×
1707
  }
1708

1709
  tsdbRowClose(&iter);
×
1710
  tSimpleHashCleanup(iColHash);
×
1711
  taosArrayClear(ctxArray);
×
1712

1713
  TAOS_RETURN(code);
×
1714
}
1715

1716
/*
 * Update the last / last_row cache from a column-format data block.
 *
 * A private context array is built with: a LAST context for the timestamp
 * column of the block's last row; for each column that has values, a LAST
 * context for the bottom-most row whose bit value is 2; and a LAST_ROW
 * context for every column of the last row. The array is passed to
 * tsdbCacheUpdate and destroyed afterwards, together with the schema fetched
 * through metaGetTbTSchemaEx.
 *
 * Returns 0 on success or the first error code.
 */
int32_t tsdbCacheColFormatUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, SBlockData *pBlockData) {
  int32_t      code = 0, lino = 0;
  STSDBRowIter iter = {0};
  STSchema    *pTSchema = NULL;
  SArray      *ctxArray = NULL;

  TSDBROW lRow = tsdbRowFromBlockData(pBlockData, pBlockData->nRow - 1);
  int32_t sver = TSDBROW_SVERSION(&lRow);

  TAOS_CHECK_RETURN(metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, sver, &pTSchema));

  ctxArray = taosArrayInit(pBlockData->nColData, sizeof(SLastUpdateCtx));
  if (NULL == ctxArray) {
    TAOS_CHECK_GOTO(terrno, &lino, _exit);
  }

  // 1. prepare last
  STsdbRowKey lastRowKey = {0};
  tsdbRowGetKey(&lRow, &lastRowKey);

  {
    // timestamp column of the last row
    SValue tsVal = {.type = TSDB_DATA_TYPE_TIMESTAMP};
    VALUE_SET_TRIVIAL_DATUM(&tsVal, lRow.pBlockData->aTSKEY[lRow.iRow]);
    SLastUpdateCtx tsCtx = {
        .lflag = LFLAG_LAST, .tsdbRowKey = lastRowKey, .colVal = COL_VAL_VALUE(PRIMARYKEY_TIMESTAMP_COL_ID, tsVal)};
    if (!taosArrayPush(ctxArray, &tsCtx)) {
      TAOS_CHECK_GOTO(terrno, &lino, _exit);
    }
  }

  TSDBROW tRow = tsdbRowFromBlockData(pBlockData, 0);

  for (int32_t iColData = 0; iColData < pBlockData->nColData; ++iColData) {
    SColData *pColData = &pBlockData->aColData[iColData];
    if ((pColData->flag & HAS_VALUE) != HAS_VALUE) {
      continue;
    }

    // scan upwards from the bottom row until a row with bit value 2 is found
    for (tRow.iRow = pBlockData->nRow - 1; tRow.iRow >= 0; --tRow.iRow) {
      STsdbRowKey rowKey = {0};
      tsdbRowGetKey(&tRow, &rowKey);

      uint8_t bitVal = tColDataGetBitValue(pColData, tRow.iRow);
      if (bitVal != 2) {
        continue;
      }

      SColVal colVal = COL_VAL_NONE(pColData->cid, pColData->type);
      TAOS_CHECK_GOTO(tColDataGetValue(pColData, tRow.iRow, &colVal), &lino, _exit);

      SLastUpdateCtx lastCtx = {.lflag = LFLAG_LAST, .tsdbRowKey = rowKey, .colVal = colVal};
      if (!taosArrayPush(ctxArray, &lastCtx)) {
        TAOS_CHECK_GOTO(terrno, &lino, _exit);
      }
      break;
    }
  }

  // 2. prepare last row
  TAOS_CHECK_GOTO(tsdbRowIterOpen(&iter, &lRow, pTSchema), &lino, _exit);
  SColVal *pColVal = tsdbRowIterNext(&iter);
  while (pColVal) {
    SLastUpdateCtx lastRowCtx = {.lflag = LFLAG_LAST_ROW, .tsdbRowKey = lastRowKey, .colVal = *pColVal};
    if (!taosArrayPush(ctxArray, &lastRowCtx)) {
      TAOS_CHECK_GOTO(terrno, &lino, _exit);
    }
    pColVal = tsdbRowIterNext(&iter);
  }

  TAOS_CHECK_GOTO(tsdbCacheUpdate(pTsdb, suid, uid, ctxArray), &lino, _exit);

_exit:
  tsdbRowClose(&iter);
  taosMemoryFreeClear(pTSchema);
  taosArrayDestroy(ctxArray);

  TAOS_RETURN(code);
}
1790

1791
// Forward declarations of the two raw-data loaders called by tsdbCacheLoadFromRaw().
// Both receive the column ids to load (aCols/nCols) together with the matching slot ids and hand the
// loaded columns back through *ppLastArray; the caller releases that array with taosArrayDestroy().
static int32_t mergeLastCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr,
                            int16_t *aCols, int nCols, int16_t *slotIds);

static int32_t mergeLastRowCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr,
                               int16_t *aCols, int nCols, int16_t *slotIds);
1796

1797
static int32_t tsdbCacheLoadFromRaw(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SArray *remainCols,
×
1798
                                    SCacheRowsReader *pr, int8_t ltype) {
1799
  int32_t code = 0, lino = 0;
×
1800
  // rocksdb_writebatch_t *wb = NULL;
1801
  SArray *pTmpColArray = NULL;
×
1802
  bool    extraTS = false;
×
1803

1804
  SIdxKey *idxKey = taosArrayGet(remainCols, 0);
×
1805
  if (idxKey->key.cid != PRIMARYKEY_TIMESTAMP_COL_ID) {
×
1806
    // ignore 'ts' loaded from cache and load it from tsdb
1807
    // SLastCol *pLastCol = taosArrayGet(pLastArray, 0);
1808
    // tsdbCacheUpdateLastColToNone(pLastCol, TSDB_LAST_CACHE_NO_CACHE);
1809

1810
    SLastKey *key = &(SLastKey){.lflag = ltype, .uid = uid, .cid = PRIMARYKEY_TIMESTAMP_COL_ID};
×
1811
    if (!taosArrayInsert(remainCols, 0, &(SIdxKey){0, *key})) {
×
1812
      TAOS_RETURN(terrno);
×
1813
    }
1814

1815
    extraTS = true;
×
1816
  }
1817

1818
  int      num_keys = TARRAY_SIZE(remainCols);
×
1819
  int16_t *slotIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1820

1821
  int16_t *lastColIds = NULL, *lastSlotIds = NULL, *lastrowColIds = NULL, *lastrowSlotIds = NULL;
×
1822
  lastColIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1823
  lastSlotIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1824
  lastrowColIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1825
  lastrowSlotIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1826
  SArray *lastTmpColArray = NULL, *lastTmpIndexArray = NULL, *lastrowTmpColArray = NULL, *lastrowTmpIndexArray = NULL;
×
1827

1828
  int lastIndex = 0;
×
1829
  int lastrowIndex = 0;
×
1830

1831
  if (!slotIds || !lastColIds || !lastSlotIds || !lastrowColIds || !lastrowSlotIds) {
×
1832
    TAOS_CHECK_EXIT(terrno);
×
1833
  }
1834

1835
  for (int i = 0; i < num_keys; ++i) {
×
1836
    SIdxKey *idxKey = taosArrayGet(remainCols, i);
×
1837
    if (extraTS && !i) {
×
1838
      slotIds[i] = 0;
×
1839
    } else {
1840
      slotIds[i] = pr->pSlotIds[idxKey->idx];
×
1841
    }
1842

1843
    if (IS_LAST_KEY(idxKey->key)) {
×
1844
      if (NULL == lastTmpIndexArray) {
×
1845
        lastTmpIndexArray = taosArrayInit(num_keys, sizeof(int32_t));
×
1846
        if (!lastTmpIndexArray) {
×
1847
          TAOS_CHECK_EXIT(terrno);
×
1848
        }
1849
      }
1850
      if (!taosArrayPush(lastTmpIndexArray, &(i))) {
×
1851
        TAOS_CHECK_EXIT(terrno);
×
1852
      }
1853
      lastColIds[lastIndex] = idxKey->key.cid;
×
1854
      if (extraTS && !i) {
×
1855
        lastSlotIds[lastIndex] = 0;
×
1856
      } else {
1857
        lastSlotIds[lastIndex] = pr->pSlotIds[idxKey->idx];
×
1858
      }
1859
      lastIndex++;
×
1860
    } else {
1861
      if (NULL == lastrowTmpIndexArray) {
×
1862
        lastrowTmpIndexArray = taosArrayInit(num_keys, sizeof(int32_t));
×
1863
        if (!lastrowTmpIndexArray) {
×
1864
          TAOS_CHECK_EXIT(terrno);
×
1865
        }
1866
      }
1867
      if (!taosArrayPush(lastrowTmpIndexArray, &(i))) {
×
1868
        TAOS_CHECK_EXIT(terrno);
×
1869
      }
1870
      lastrowColIds[lastrowIndex] = idxKey->key.cid;
×
1871
      if (extraTS && !i) {
×
1872
        lastrowSlotIds[lastrowIndex] = 0;
×
1873
      } else {
1874
        lastrowSlotIds[lastrowIndex] = pr->pSlotIds[idxKey->idx];
×
1875
      }
1876
      lastrowIndex++;
×
1877
    }
1878
  }
1879

1880
  pTmpColArray = taosArrayInit(lastIndex + lastrowIndex, sizeof(SLastCol));
×
1881
  if (!pTmpColArray) {
×
1882
    TAOS_CHECK_EXIT(terrno);
×
1883
  }
1884

1885
  if (lastTmpIndexArray != NULL) {
×
1886
    TAOS_CHECK_EXIT(mergeLastCid(uid, pTsdb, &lastTmpColArray, pr, lastColIds, lastIndex, lastSlotIds));
×
1887
    for (int i = 0; i < taosArrayGetSize(lastTmpColArray); i++) {
×
1888
      if (!taosArrayInsert(pTmpColArray, *(int32_t *)taosArrayGet(lastTmpIndexArray, i),
×
1889
                           taosArrayGet(lastTmpColArray, i))) {
×
1890
        TAOS_CHECK_EXIT(terrno);
×
1891
      }
1892
    }
1893
  }
1894

1895
  if (lastrowTmpIndexArray != NULL) {
×
1896
    TAOS_CHECK_EXIT(mergeLastRowCid(uid, pTsdb, &lastrowTmpColArray, pr, lastrowColIds, lastrowIndex, lastrowSlotIds));
×
1897
    for (int i = 0; i < taosArrayGetSize(lastrowTmpColArray); i++) {
×
1898
      if (!taosArrayInsert(pTmpColArray, *(int32_t *)taosArrayGet(lastrowTmpIndexArray, i),
×
1899
                           taosArrayGet(lastrowTmpColArray, i))) {
×
1900
        TAOS_CHECK_EXIT(terrno);
×
1901
      }
1902
    }
1903
  }
1904

1905
  SLRUCache *pCache = pTsdb->lruCache;
×
1906
  for (int i = 0; i < num_keys; ++i) {
×
1907
    SIdxKey  *idxKey = taosArrayGet(remainCols, i);
×
1908
    SLastCol *pLastCol = NULL;
×
1909

1910
    if (pTmpColArray && TARRAY_SIZE(pTmpColArray) >= i + 1) {
×
1911
      pLastCol = taosArrayGet(pTmpColArray, i);
×
1912
    }
1913

1914
    // still null, then make up a none col value
1915
    SLastCol noneCol = {.rowKey.ts = TSKEY_MIN,
×
1916
                        .colVal = COL_VAL_NONE(idxKey->key.cid, pr->pSchema->columns[slotIds[i]].type),
×
1917
                        .cacheStatus = TSDB_LAST_CACHE_VALID};
1918
    if (!pLastCol) {
×
1919
      pLastCol = &noneCol;
×
1920
    }
1921

1922
    if (!extraTS || i > 0) {
×
1923
      tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64 " from tsdb, col_id:%d col_flag:%d ts:%" PRId64,
×
1924
                TD_VID(pTsdb->pVnode), __func__, pr && pr->idstr ? pr->idstr : "null", uid, pLastCol->colVal.cid,
1925
                pLastCol->colVal.flag, pLastCol->rowKey.ts);
1926
      taosArraySet(pLastArray, idxKey->idx, pLastCol);
×
1927
    }
1928

1929
    // taosArrayRemove(remainCols, i);
1930

1931
    if (/*!pTmpColArray*/ lastTmpIndexArray && !lastTmpColArray) {
×
1932
      continue;
×
1933
    }
1934
    if (/*!pTmpColArray*/ lastrowTmpIndexArray && !lastrowTmpColArray) {
×
1935
      continue;
×
1936
    }
1937

1938
    // store result back to rocks cache
1939
    code = tsdbCachePutToRocksdb(pTsdb, &idxKey->key, pLastCol);
×
1940
    if (code) {
×
1941
      tsdbError("vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
×
1942
      TAOS_CHECK_EXIT(code);
×
1943
    }
1944

1945
    code = tsdbCachePutToLRU(pTsdb, &idxKey->key, pLastCol, 0);
×
1946
    if (code) {
×
1947
      tsdbError("vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
×
1948
      TAOS_CHECK_EXIT(code);
×
1949
    }
1950

1951
    if (extraTS && i == 0) {
×
1952
      tsdbCacheFreeSLastColItem(pLastCol);
×
1953
    }
1954
  }
1955

1956
  rocksMayWrite(pTsdb, false);
×
1957

1958
_exit:
×
1959
  taosArrayDestroy(lastrowTmpIndexArray);
×
1960
  taosArrayDestroy(lastrowTmpColArray);
×
1961
  taosArrayDestroy(lastTmpIndexArray);
×
1962
  taosArrayDestroy(lastTmpColArray);
×
1963

1964
  taosMemoryFree(lastColIds);
×
1965
  taosMemoryFree(lastSlotIds);
×
1966
  taosMemoryFree(lastrowColIds);
×
1967
  taosMemoryFree(lastrowSlotIds);
×
1968

1969
  taosArrayDestroy(pTmpColArray);
×
1970

1971
  taosMemoryFree(slotIds);
×
1972

1973
  TAOS_RETURN(code);
×
1974
}
1975

1976
/*
 * Resolve the columns in remainCols from the rocksdb cache; whatever is still unresolved afterwards is
 * loaded from raw tsdb data via tsdbCacheLoadFromRaw().
 *
 * pTsdb           - tsdb instance
 * uid             - table uid
 * pLastArray      - result array; entry idxKey->idx is overwritten for every column found in rocksdb
 * remainCols      - SIdxKey array of unresolved columns; resolved entries are removed from it
 * ignoreFromRocks - bool array kept parallel to remainCols; a true entry means the value read from
 *                   rocksdb is skipped for that column
 * pr              - reader (used for logging and forwarded to tsdbCacheLoadFromRaw)
 * ltype           - forwarded to tsdbCacheLoadFromRaw
 *
 * Returns 0 on success, an error code otherwise.
 */
static int32_t tsdbCacheLoadFromRocks(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SArray *remainCols,
                                      SArray *ignoreFromRocks, SCacheRowsReader *pr, int8_t ltype) {
  int32_t code = 0, lino = 0;
  int     num_keys = TARRAY_SIZE(remainCols);
  char  **keys_list = taosMemoryMalloc(num_keys * sizeof(char *));
  size_t *keys_list_sizes = taosMemoryMalloc(num_keys * sizeof(size_t));
  char   *key_list = taosMemoryMalloc(num_keys * ROCKS_KEY_LEN);
  if (!keys_list || !keys_list_sizes || !key_list) {
    code = terrno;
    // release all three buffers: any subset of them may have been allocated
    taosMemoryFree(key_list);
    taosMemoryFree(keys_list);
    taosMemoryFree(keys_list_sizes);
    TAOS_RETURN(code);
  }
  char  **values_list = NULL;
  size_t *values_list_sizes = NULL;

  // snapshot the keys: key_list holds the key bytes back to back, keys_list points into it
  for (int i = 0; i < num_keys; ++i) {
    memcpy(key_list + i * ROCKS_KEY_LEN, &((SIdxKey *)taosArrayGet(remainCols, i))->key, ROCKS_KEY_LEN);
    keys_list[i] = key_list + i * ROCKS_KEY_LEN;
    keys_list_sizes[i] = ROCKS_KEY_LEN;
  }

  rocksMayWrite(pTsdb, true);  // flush writebatch cache

  code = tsdbCacheGetValuesFromRocks(pTsdb, num_keys, (const char *const *)keys_list, keys_list_sizes, &values_list,
                                     &values_list_sizes);
  if (code) {
    taosMemoryFree(key_list);
    taosMemoryFree(keys_list);
    taosMemoryFree(keys_list_sizes);
    TAOS_RETURN(code);
  }

  // i walks the key snapshot / values_list, j walks the live remainCols and ignoreFromRocks arrays,
  // which shrink whenever a column is resolved
  for (int i = 0, j = 0; i < num_keys && j < TARRAY_SIZE(remainCols); ++i) {
    SLastCol *pLastCol = NULL;
    // ignoreFromRocks is shrunk together with remainCols below, so it has to be read with j
    bool ignore = ((bool *)TARRAY_DATA(ignoreFromRocks))[j];
    if (ignore) {
      ++j;
      continue;
    }

    if (values_list[i] != NULL) {
      code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
        goto _exit;
      }
    }
    SLastCol *pToFree = pLastCol;
    SIdxKey  *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[j];
    if (pLastCol && pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
      code = tsdbCachePutToLRU(pTsdb, &idxKey->key, pLastCol, 0);
      if (code) {
        tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
        taosMemoryFreeClear(pToFree);
        TAOS_CHECK_EXIT(code);
      }

      // hand the caller its own copy; the deserialized buffer is released below
      SLastCol lastCol = *pLastCol;
      code = tsdbCacheReallocSLastCol(&lastCol, NULL);
      if (TSDB_CODE_SUCCESS != code) {
        taosMemoryFreeClear(pToFree);
        TAOS_CHECK_EXIT(code);
      }

      tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64 " from rocksdb, col_id:%d col_flag:%d ts:%" PRId64,
                TD_VID(pTsdb->pVnode), __func__, pr && pr->idstr ? pr->idstr : "null", uid, lastCol.colVal.cid,
                lastCol.colVal.flag, lastCol.rowKey.ts);

      taosArraySet(pLastArray, idxKey->idx, &lastCol);
      taosArrayRemove(remainCols, j);
      taosArrayRemove(ignoreFromRocks, j);
    } else {
      ++j;
    }

    taosMemoryFreeClear(pToFree);
  }

  if (TARRAY_SIZE(remainCols) > 0) {
    // tsdbTrace("tsdb/cache: vgId: %d, load %" PRId64 " from raw", TD_VID(pTsdb->pVnode), uid);
    code = tsdbCacheLoadFromRaw(pTsdb, uid, pLastArray, remainCols, pr, ltype);
  }

_exit:
  taosMemoryFree(key_list);
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  if (values_list) {
#ifdef USE_ROCKSDB
    for (int i = 0; i < num_keys; ++i) {
      rocksdb_free(values_list[i]);
    }
#endif
    taosMemoryFree(values_list);
  }
  taosMemoryFree(values_list_sizes);

  TAOS_RETURN(code);
}
2076

2077
/*
 * Fill pLastArray with one SLastCol per column id in pr->pCidList, taking values from the LRU cache
 * where possible and falling back to tsdbCacheLoadFromRocks() for the rest.
 *
 * pTsdb      - tsdb instance
 * uid        - table uid
 * pLastArray - output; receives exactly one entry per requested column (a NONE value as placeholder
 *              until the column is resolved)
 * pr         - reader supplying pCidList, pFuncTypeList, type, pSchema, pSlotIds and idstr
 * ltype      - default lflag of the lookup keys
 * keyArray   - output; receives the SLastKey built for every requested column
 *
 * Returns 0 on success, an error code otherwise.
 */
static int32_t tsdbCacheGetBatchFromLru(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SCacheRowsReader *pr,
                                        int8_t ltype, SArray *keyArray) {
  int32_t    code = 0, lino = 0;
  SArray    *remainCols = NULL;
  SArray    *ignoreFromRocks = NULL;
  SLRUCache *pCache = pTsdb->lruCache;
  SArray    *pCidList = pr->pCidList;
  int        numKeys = TARRAY_SIZE(pCidList);

  // first pass: lock-free lookup of every column in the LRU cache
  for (int i = 0; i < numKeys; ++i) {
    int16_t cid = ((int16_t *)TARRAY_DATA(pCidList))[i];

    SLastKey key = {.lflag = ltype, .uid = uid, .cid = cid};
    // for select last_row, last case
    int32_t funcType = FUNCTION_TYPE_CACHE_LAST;
    if (pr->pFuncTypeList != NULL && taosArrayGetSize(pr->pFuncTypeList) > i) {
      funcType = ((int32_t *)TARRAY_DATA(pr->pFuncTypeList))[i];
    }
    if (((pr->type & CACHESCAN_RETRIEVE_LAST) == CACHESCAN_RETRIEVE_LAST) && FUNCTION_TYPE_CACHE_LAST_ROW == funcType) {
      int8_t tempType = CACHESCAN_RETRIEVE_LAST_ROW | (pr->type ^ CACHESCAN_RETRIEVE_LAST);
      key.lflag = (tempType & CACHESCAN_RETRIEVE_LAST) >> 3;
    }

    if (!taosArrayPush(keyArray, &key)) {
      TAOS_CHECK_EXIT(terrno);
    }

    LRUHandle *h = taosLRUCacheLookup(pCache, &key, ROCKS_KEY_LEN);
    SLastCol  *pLastCol = h ? (SLastCol *)taosLRUCacheValue(pCache, h) : NULL;
    if (h && pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
      // cache hit: give the caller a private copy of the cached column
      SLastCol lastCol = *pLastCol;
      if (TSDB_CODE_SUCCESS != (code = tsdbCacheReallocSLastCol(&lastCol, NULL))) {
        tsdbLRUCacheRelease(pCache, h, false);
        TAOS_CHECK_GOTO(code, NULL, _exit);
      }

      tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64 " from lru, col_id:%d col_flag:%d ts:%" PRId64, TD_VID(pTsdb->pVnode),
                __func__, pr && pr->idstr ? pr->idstr : "null", uid, lastCol.colVal.cid, lastCol.colVal.flag,
                lastCol.rowKey.ts);

      if (taosArrayPush(pLastArray, &lastCol) == NULL) {
        code = terrno;
        tsdbLRUCacheRelease(pCache, h, false);
        goto _exit;
      }
    } else {
      // no cache or cache is invalid
      SLastCol noneCol = {.rowKey.ts = TSKEY_MIN,
                          .colVal = COL_VAL_NONE(cid, pr->pSchema->columns[pr->pSlotIds[i]].type)};

      if (taosArrayPush(pLastArray, &noneCol) == NULL) {
        code = terrno;
        tsdbLRUCacheRelease(pCache, h, false);
        goto _exit;
      }

      if (!remainCols) {
        if ((remainCols = taosArrayInit(numKeys, sizeof(SIdxKey))) == NULL) {
          code = terrno;
          tsdbLRUCacheRelease(pCache, h, false);
          goto _exit;
        }
      }
      if (!ignoreFromRocks) {
        if ((ignoreFromRocks = taosArrayInit(numKeys, sizeof(bool))) == NULL) {
          code = terrno;
          tsdbLRUCacheRelease(pCache, h, false);
          goto _exit;
        }
      }
      if (taosArrayPush(remainCols, &(SIdxKey){i, key}) == NULL) {
        code = terrno;
        tsdbLRUCacheRelease(pCache, h, false);
        goto _exit;
      }
      // an LRU entry marked NO_CACHE means the rocksdb copy must not be used for this column
      bool ignoreRocks = pLastCol ? (pLastCol->cacheStatus == TSDB_LAST_CACHE_NO_CACHE) : false;
      if (taosArrayPush(ignoreFromRocks, &ignoreRocks) == NULL) {
        code = terrno;
        tsdbLRUCacheRelease(pCache, h, false);
        goto _exit;
      }
    }

    if (h) {
      tsdbLRUCacheRelease(pCache, h, false);
    }
  }

  if (remainCols && TARRAY_SIZE(remainCols) > 0) {
    (void)taosThreadMutexLock(&pTsdb->lruMutex);

    // second pass under lruMutex: retry the LRU cache for the columns that missed in the first pass
    for (int i = 0; i < TARRAY_SIZE(remainCols);) {
      SIdxKey   *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[i];
      LRUHandle *h = taosLRUCacheLookup(pCache, &idxKey->key, ROCKS_KEY_LEN);
      SLastCol  *pLastCol = h ? (SLastCol *)taosLRUCacheValue(pCache, h) : NULL;
      if (h && pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
        SLastCol lastCol = *pLastCol;
        code = tsdbCacheReallocSLastCol(&lastCol, NULL);
        if (code) {
          tsdbLRUCacheRelease(pCache, h, false);
          (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
          // leave through _exit so that remainCols and ignoreFromRocks are destroyed
          goto _exit;
        }

        tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64 " from lru(2nd lookup), col_id:%d col_flag:%d ts:%" PRId64,
                  TD_VID(pTsdb->pVnode), __func__, pr && pr->idstr ? pr->idstr : "null", uid, lastCol.colVal.cid,
                  lastCol.colVal.flag, lastCol.rowKey.ts);

        taosArraySet(pLastArray, idxKey->idx, &lastCol);

        // resolved: drop the column from both parallel arrays (i stays on the next element)
        taosArrayRemove(remainCols, i);
        taosArrayRemove(ignoreFromRocks, i);
      } else {
        // no cache or cache is invalid
        ++i;
      }
      if (h) {
        tsdbLRUCacheRelease(pCache, h, false);
      }
    }

    // tsdbTrace("tsdb/cache: vgId: %d, load %" PRId64 " from rocks", TD_VID(pTsdb->pVnode), uid);
    code = tsdbCacheLoadFromRocks(pTsdb, uid, pLastArray, remainCols, ignoreFromRocks, pr, ltype);

    (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
  }

_exit:
  if (remainCols) {
    taosArrayDestroy(remainCols);
  }
  if (ignoreFromRocks) {
    taosArrayDestroy(ignoreFromRocks);
  }

  TAOS_RETURN(code);
}
2214

2215
// State of an SMemNextRowIter as driven by getNextRowFromMem().
typedef enum SMEMNEXTROWSTATES {
  SMEMNEXTROW_ENTER,  // iterator not opened yet; the next call opens it and fetches the first row
  SMEMNEXTROW_NEXT,   // iterator is open; the next call advances it by one row
} SMEMNEXTROWSTATES;
2219

2220
typedef struct SMemNextRowIter {
2221
  SMEMNEXTROWSTATES state;
2222
  STbData          *pMem;  // [input]
2223
  STbDataIter       iter;  // mem buffer skip list iterator
2224
  int64_t           lastTs;
2225
} SMemNextRowIter;
2226

2227
/*
 * _next_row_fn_t implementation for memory tables: yield the next row of an SMemNextRowIter.
 *
 * iter             - SMemNextRowIter to read from
 * ppRow            - receives the row, or NULL when there is nothing (more) to return
 * pIgnoreEarlierTs - always set to false
 * isLast, aCols, nCols - unused here; present to match _next_row_fn_t
 *
 * Always returns 0.
 *
 * NOTE: a former early-out that compared pMem->maxKey with lastTs is disabled in the original code.
 */
static int32_t getNextRowFromMem(void *iter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast, int16_t *aCols,
                                 int nCols) {
  SMemNextRowIter *pMemIter = (SMemNextRowIter *)iter;
  int32_t          code = 0;
  TSDBROW         *pNextRow = NULL;

  *pIgnoreEarlierTs = false;

  if (pMemIter->state == SMEMNEXTROW_ENTER) {
    // first call: open the iterator; only switch to NEXT once a first row was actually found
    if (pMemIter->pMem != NULL) {
      tsdbTbDataIterOpen(pMemIter->pMem, NULL, 1, &pMemIter->iter);

      pNextRow = tsdbTbDataIterGet(&pMemIter->iter);
      if (pNextRow) {
        pMemIter->state = SMEMNEXTROW_NEXT;
      }
    }
  } else if (pMemIter->state == SMEMNEXTROW_NEXT) {
    if (tsdbTbDataIterNext(&pMemIter->iter)) {
      pNextRow = tsdbTbDataIterGet(&pMemIter->iter);
    }
  }
  // any other state value yields no row

  *ppRow = pNextRow;

  TAOS_RETURN(code);
}
2277

2278
// Row source callback: stores the next row in *ppRow (NULL when exhausted) and returns an error code.
typedef int32_t (*_next_row_fn_t)(void *iter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast,
                                  int16_t *aCols, int nCols);
// Optional cleanup callback for the iterator handed to a _next_row_fn_t.
typedef int32_t (*_next_row_clear_fn_t)(void *iter);
2281

2282
typedef struct {
2283
  TSDBROW             *pRow;
2284
  bool                 stop;
2285
  bool                 next;
2286
  bool                 ignoreEarlierTs;
2287
  void                *iter;
2288
  _next_row_fn_t       nextRowFn;
2289
  _next_row_clear_fn_t nextRowClearFn;
2290
} TsdbNextRowState;
2291

2292
typedef struct {
2293
  SArray           *pMemDelData;
2294
  SArray           *pSkyline;
2295
  int64_t           iSkyline;
2296
  SBlockIdx         idx;
2297
  SMemNextRowIter   memState;
2298
  SMemNextRowIter   imemState;
2299
  TSDBROW           memRow, imemRow;
2300
  TsdbNextRowState  input[2];
2301
  SCacheRowsReader *pr;
2302
  STsdb            *pTsdb;
2303
} MemNextRowIter;
2304

2305
static int32_t memRowIterOpen(MemNextRowIter *pIter, tb_uid_t uid, STsdb *pTsdb, STSchema *pTSchema, tb_uid_t suid,
×
2306
                              STsdbReadSnap *pReadSnap, SCacheRowsReader *pr) {
2307
  int32_t code = 0, lino = 0;
×
2308

2309
  STbData *pMem = NULL;
×
2310
  if (pReadSnap->pMem) {
×
2311
    pMem = tsdbGetTbDataFromMemTable(pReadSnap->pMem, suid, uid);
×
2312
  }
2313

2314
  STbData *pIMem = NULL;
×
2315
  if (pReadSnap->pIMem) {
×
2316
    pIMem = tsdbGetTbDataFromMemTable(pReadSnap->pIMem, suid, uid);
×
2317
  }
2318

2319
  pIter->pTsdb = pTsdb;
×
2320

2321
  pIter->pMemDelData = NULL;
×
2322

2323
  TAOS_CHECK_GOTO(loadMemTombData(&pIter->pMemDelData, pMem, pIMem, pr->info.verRange.maxVer), &lino, _exit);
×
2324

2325
  pIter->idx = (SBlockIdx){.suid = suid, .uid = uid};
×
2326

2327
  pIter->input[0] = (TsdbNextRowState){&pIter->memRow, true, false, false, &pIter->memState, getNextRowFromMem, NULL};
×
2328
  pIter->input[1] = (TsdbNextRowState){&pIter->imemRow, true, false, false, &pIter->imemState, getNextRowFromMem, NULL};
×
2329

2330
  if (pMem) {
×
2331
    pIter->memState.pMem = pMem;
×
2332
    pIter->memState.state = SMEMNEXTROW_ENTER;
×
2333
    pIter->input[0].stop = false;
×
2334
    pIter->input[0].next = true;
×
2335
  }
2336

2337
  if (pIMem) {
×
2338
    pIter->imemState.pMem = pIMem;
×
2339
    pIter->imemState.state = SMEMNEXTROW_ENTER;
×
2340
    pIter->input[1].stop = false;
×
2341
    pIter->input[1].next = true;
×
2342
  }
2343

2344
  pIter->pr = pr;
×
2345

2346
_exit:
×
2347
  if (code) {
×
2348
    tsdbError("tsdb/cache: %s failed at line %d since %s.", __func__, lino, tstrerror(code));
×
2349
  }
2350

2351
  TAOS_RETURN(code);
×
2352
}
2353

2354
// Release what a MemNextRowIter owns: run the optional per-source cleanup callbacks, then destroy
// the skyline and the delete-data arrays if they exist.
static void memRowIterClose(MemNextRowIter *pIter) {
  TsdbNextRowState *pInput = pIter->input;
  for (int i = 0; i < 2; ++i, ++pInput) {
    if (pInput->nextRowClearFn != NULL) {
      (void)pInput->nextRowClearFn(pInput->iter);
    }
  }

  if (pIter->pSkyline != NULL) {
    taosArrayDestroy(pIter->pSkyline);
  }

  if (pIter->pMemDelData != NULL) {
    taosArrayDestroy(pIter->pMemDelData);
  }
}
×
2369

2370
// Free callback installed on the reader's table map by getTableLoadInfo(): `param` points at a stored
// pointer value; the pointed-to allocation is freed and the stored pointer cleared.
static void freeTableInfoFunc(void *param) {
  void **ppValue = param;
  taosMemoryFreeClear(*ppValue);
}
×
2374

2375
/*
 * Return the STableLoadInfo registered for `uid` in pReader->pTableMap, creating the map and/or a
 * zero-initialized entry on first use.
 *
 * pReader - reader owning the table map
 * uid     - table uid used as the map key
 *
 * Returns the entry, or NULL when the map or the entry could not be created.
 */
static STableLoadInfo *getTableLoadInfo(SCacheRowsReader *pReader, uint64_t uid) {
  if (!pReader->pTableMap) {
    pReader->pTableMap = tSimpleHashInit(pReader->numOfTables, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT));
    if (!pReader->pTableMap) {
      return NULL;
    }

    // stored values are STableLoadInfo pointers; let the map free them
    tSimpleHashSetFreeFp(pReader->pTableMap, freeTableInfoFunc);
  }

  STableLoadInfo **ppInfo = tSimpleHashGet(pReader->pTableMap, &uid, sizeof(uid));
  if (ppInfo) {
    return *ppInfo;
  }

  STableLoadInfo *pInfo = taosMemoryCalloc(1, sizeof(STableLoadInfo));
  if (!pInfo) {
    return NULL;
  }

  if (tSimpleHashPut(pReader->pTableMap, &uid, sizeof(uint64_t), &pInfo, POINTER_BYTES)) {
    // the entry was not stored, so nothing else will ever free it
    taosMemoryFree(pInfo);
    return NULL;
  }

  return pInfo;
}
2400

2401
/*
 * Return the next row of the mem/imem merge that tsdbKeyDeleted() does not report as deleted.
 *
 * Each round refills the sources flagged `next`, selects the buffered row(s) with the largest row key,
 * checks them against the delete skyline (built on first use from the table's tomb data plus the
 * in-memory delete data) and returns the first surviving one. Rows reported as deleted are skipped.
 *
 * pIter                - iterator prepared by memRowIterOpen()
 * isLast, aCols, nCols - forwarded unchanged to the sources' nextRowFn
 *
 * Returns the row, or NULL when both sources are exhausted or an error occurred (errors are logged).
 */
static TSDBROW *memRowIterGet(MemNextRowIter *pIter, bool isLast, int16_t *aCols, int nCols) {
  int32_t code = 0, lino = 0;

  while (true) {
    // 1. refill every source that consumed its row in the previous round
    for (int i = 0; i < 2; ++i) {
      TsdbNextRowState *pInput = &pIter->input[i];
      if (!pInput->next || pInput->stop) {
        continue;
      }

      TAOS_CHECK_GOTO(
          pInput->nextRowFn(pInput->iter, &pInput->pRow, &pInput->ignoreEarlierTs, isLast, aCols, nCols), &lino,
          _exit);

      if (pInput->pRow == NULL) {
        pInput->stop = true;
        pInput->next = false;
      }
    }

    if (pIter->input[0].stop && pIter->input[1].stop) {
      return NULL;
    }

    // 2. collect the buffered row(s) carrying the largest key; equal keys are all kept
    TSDBROW *aCand[2] = {0};
    int      aCandSrc[2] = {-1, -1};
    int      nCand = 0;
    SRowKey  maxKey = {.ts = TSKEY_MIN};

    for (int i = 0; i < 2; ++i) {
      TsdbNextRowState *pInput = &pIter->input[i];
      if (pInput->stop || pInput->pRow == NULL) {
        continue;
      }

      STsdbRowKey rowKey = {0};
      tsdbRowGetKey(pInput->pRow, &rowKey);

      // merging & deduplicating on client side
      int c = tRowKeyCompare(&maxKey, &rowKey.key);
      if (c < 0) {
        // strictly larger key: restart the candidate list
        nCand = 0;
        maxKey = rowKey.key;
      }
      if (c <= 0) {
        aCandSrc[nCand] = i;
        aCand[nCand++] = pInput->pRow;
      }
      pInput->next = false;
    }

    // 3. drop candidates reported as deleted; their sources are advanced in the next round
    TSDBROW *aKeep[2] = {0};
    int      aKeepSrc[2] = {-1, -1};
    int      nKeep = 0;
    for (int i = 0; i < nCand; ++i) {
      TSDBKEY candKey = TSDBROW_KEY(aCand[i]);

      if (!pIter->pSkyline) {
        // first use: build the skyline from the table's tomb data plus the in-memory delete data
        pIter->pSkyline = taosArrayInit(32, sizeof(TSDBKEY));
        TSDB_CHECK_NULL(pIter->pSkyline, code, lino, _exit, terrno);

        uint64_t        uid = pIter->idx.uid;
        STableLoadInfo *pInfo = getTableLoadInfo(pIter->pr, uid);
        TSDB_CHECK_NULL(pInfo, code, lino, _exit, TSDB_CODE_OUT_OF_MEMORY);

        if (pInfo->pTombData == NULL) {
          pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
          TSDB_CHECK_NULL(pInfo->pTombData, code, lino, _exit, terrno);
        }

        if (!taosArrayAddAll(pInfo->pTombData, pIter->pMemDelData)) {
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
        }

        size_t delSize = TARRAY_SIZE(pInfo->pTombData);
        if (delSize > 0) {
          code = tsdbBuildDeleteSkyline(pInfo->pTombData, 0, (int32_t)(delSize - 1), pIter->pSkyline);
          TAOS_CHECK_GOTO(code, &lino, _exit);
        }
        pIter->iSkyline = taosArrayGetSize(pIter->pSkyline) - 1;
      }

      bool deleted = tsdbKeyDeleted(&candKey, pIter->pSkyline, &pIter->iSkyline);
      if (!deleted) {
        aKeepSrc[nKeep] = aCandSrc[i];
        aKeep[nKeep++] = aCand[i];
      }

      pIter->input[aCandSrc[i]].next = deleted;
    }

    // 4. hand out the first survivor; only its source is advanced on the next call
    if (nKeep > 0) {
      pIter->input[aKeepSrc[0]].next = true;

      return aKeep[0];
    }
  }

_exit:
  if (code) {
    tsdbError("tsdb/cache: %s failed at line %d since %s.", __func__, lino, tstrerror(code));
  }

  return NULL;
}
2501

2502
/*
 * Make a heap copy of a schema, header plus its numOfCols column descriptors.
 *
 * pSrc  - schema to copy
 * ppDst - receives the copy (NULL when the allocation fails); the caller owns it
 *
 * Returns TSDB_CODE_SUCCESS, or terrno when the allocation fails.
 */
static int32_t cloneTSchema(STSchema *pSrc, STSchema **ppDst) {
  int32_t   nBytes = sizeof(STSchema) + sizeof(STColumn) * pSrc->numOfCols;
  STSchema *pCopy = taosMemoryMalloc(nBytes);

  *ppDst = pCopy;
  if (pCopy == NULL) {
    TAOS_RETURN(terrno);
  }

  memcpy(pCopy, pSrc, nBytes);

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
2512

2513
/*
 * Make pReader->pCurrSchema match schema version `sversion`.
 *
 * - no current schema and the reader's base schema has that version: clone the base schema
 * - current schema already has that version: nothing to do
 * - otherwise: drop the current schema and fetch the requested version from the meta store
 *
 * Returns 0 on success, an error code otherwise.
 */
static int32_t updateTSchema(int32_t sversion, SCacheRowsReader *pReader, uint64_t uid) {
  STSchema *pCurr = pReader->pCurrSchema;

  if (pCurr == NULL) {
    if (sversion == pReader->pSchema->version) {
      TAOS_RETURN(cloneTSchema(pReader->pSchema, &pReader->pCurrSchema));
    }
  } else if (sversion == pCurr->version) {
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  taosMemoryFreeClear(pReader->pCurrSchema);
  TAOS_RETURN(
      metaGetTbTSchemaEx(pReader->pTsdb->pVnode->pMeta, pReader->info.suid, uid, sversion, &pReader->pCurrSchema));
}
2526

2527
/*
 * Overlay memtable data on top of the last/last_row values already collected in pLastArray.
 *
 * pLastArray holds one SLastCol per requested column; keyArray holds the SLastKey for the same
 * index. The first row returned by the memtable iterator is merged against pLastArray by column
 * id (both sequences are walked in ascending cid order -- NOTE(review): this relies on pLastArray
 * being sorted by cid; confirm against the caller).
 *
 *  - For a non-"last" key the entry is replaced when the cached row key is older than the row,
 *    or equal to it and the row's column is not NONE.
 *  - For a "last" key the entry is replaced when the row carries a value and the cached row key
 *    is not newer. When the row carries no value for that column, the column is remembered in
 *    iColHash and looked for in the following memtable rows.
 *
 * Returns 0 on success or the first error code encountered.
 */
static int32_t tsdbCacheGetBatchFromMem(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SCacheRowsReader *pr,
                                        SArray *keyArray) {
  int32_t        code = 0;
  int32_t        lino = 0;
  STSchema      *pTSchema = pr->pSchema;
  MemNextRowIter iter = {0};
  SSHashObj     *iColHash = NULL;  // cid -> index in pLastArray for "last" columns still missing a value
  STSDBRowIter   rowIter = {0};

  // 1, get from mem, imem filtered with delete info
  TAOS_CHECK_EXIT(memRowIterOpen(&iter, uid, pTsdb, pTSchema, pr->info.suid, pr->pReadSnap, pr));

  TSDBROW *pRow = memRowIterGet(&iter, false, NULL, 0);
  if (!pRow) {
    goto _exit;
  }

  // A row may have been written under a different schema version than the reader's base schema.
  int32_t sversion = TSDBROW_SVERSION(pRow);
  if (sversion != -1) {
    TAOS_CHECK_EXIT(updateTSchema(sversion, pr, uid));

    pTSchema = pr->pCurrSchema;
  }
  int32_t nCol = pTSchema->numOfCols;

  STsdbRowKey rowKey = {0};
  tsdbRowGetKey(pRow, &rowKey);

  TAOS_CHECK_EXIT(tsdbRowIterOpen(&rowIter, pRow, pTSchema));

  // Merge-join the row's columns (iCol) with the requested columns (jCol) on column id.
  int32_t iCol = 0, jCol = 0, jnCol = TARRAY_SIZE(pLastArray);
  for (SColVal *pColVal = tsdbRowIterNext(&rowIter); pColVal && iCol < nCol && jCol < jnCol;) {
    SLastCol *pTargetCol = &((SLastCol *)TARRAY_DATA(pLastArray))[jCol];
    if (pColVal->cid < pTargetCol->colVal.cid) {
      pColVal = tsdbRowIterNext(&rowIter), ++iCol;

      continue;
    }
    if (pColVal->cid > pTargetCol->colVal.cid) {
      break;
    }

    int32_t cmp_res = tRowKeyCompare(&pTargetCol->rowKey, &rowKey.key);
    if (!IS_LAST_KEY(((SLastKey *)TARRAY_DATA(keyArray))[jCol])) {
      if (cmp_res < 0 || (cmp_res == 0 && !COL_VAL_IS_NONE(pColVal))) {
        SLastCol lastCol = {.rowKey = rowKey.key, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(&lastCol, NULL));

        tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64 " from memtable, col_id:%d col_flag:%d ts:%" PRId64,
                  TD_VID(pTsdb->pVnode), __func__, pr && pr->idstr ? pr->idstr : "null", uid, lastCol.colVal.cid,
                  lastCol.colVal.flag, rowKey.key.ts);

        tsdbCacheFreeSLastColItem(pTargetCol);
        taosArraySet(pLastArray, jCol, &lastCol);
      }
    } else {
      if (COL_VAL_IS_VALUE(pColVal)) {
        if (cmp_res <= 0) {
          SLastCol lastCol = {
              .rowKey = rowKey.key, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
          TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(&lastCol, NULL));

          tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64
                    " from memtable(last) and memtable(newer), col_id:%d col_flag:%d ts:%" PRId64,
                    TD_VID(pTsdb->pVnode), __func__, pr && pr->idstr ? pr->idstr : "null", uid, lastCol.colVal.cid,
                    lastCol.colVal.flag, rowKey.key.ts);

          tsdbCacheFreeSLastColItem(pTargetCol);
          taosArraySet(pLastArray, jCol, &lastCol);
        }
      } else {
        // No value for this "last" column in this row: remember it for the following rows.
        if (!iColHash) {
          iColHash = tSimpleHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT));
          if (iColHash == NULL) {
            TAOS_CHECK_EXIT(terrno);
          }
        }

        if (tSimpleHashPut(iColHash, &pColVal->cid, sizeof(pColVal->cid), &jCol, sizeof(jCol))) {
          TAOS_CHECK_EXIT(terrno);
        }
      }
    }

    ++jCol;

    // Only advance the row column when the next target has a larger cid; pLastArray may hold
    // several consecutive entries with the same cid.
    if (jCol < jnCol && ((SLastCol *)TARRAY_DATA(pLastArray))[jCol].colVal.cid > pColVal->cid) {
      pColVal = tsdbRowIterNext(&rowIter), ++iCol;
    }
  }
  tsdbRowClose(&rowIter);

  // 2, resolve the remembered "last" columns from the following memtable rows
  if (iColHash && tSimpleHashGetSize(iColHash) > 0) {
    pRow = memRowIterGet(&iter, false, NULL, 0);
    while (pRow) {
      if (tSimpleHashGetSize(iColHash) == 0) {
        break;
      }

      sversion = TSDBROW_SVERSION(pRow);
      if (sversion != -1) {
        TAOS_CHECK_EXIT(updateTSchema(sversion, pr, uid));

        pTSchema = pr->pCurrSchema;
      }
      nCol = pTSchema->numOfCols;

      STsdbRowKey tsdbRowKey = {0};
      tsdbRowGetKey(pRow, &tsdbRowKey);

      TAOS_CHECK_EXIT(tsdbRowIterOpen(&rowIter, pRow, pTSchema));

      iCol = 0;
      for (SColVal *pColVal = tsdbRowIterNext(&rowIter); pColVal && iCol < nCol;
           pColVal = tsdbRowIterNext(&rowIter), iCol++) {
        int32_t *pjCol = tSimpleHashGet(iColHash, &pColVal->cid, sizeof(pColVal->cid));
        if (pjCol && COL_VAL_IS_VALUE(pColVal)) {
          SLastCol *pTargetCol = &((SLastCol *)TARRAY_DATA(pLastArray))[*pjCol];

          int32_t cmp_res = tRowKeyCompare(&pTargetCol->rowKey, &tsdbRowKey.key);
          if (cmp_res <= 0) {
            SLastCol lastCol = {
                .rowKey = tsdbRowKey.key, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
            TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(&lastCol, NULL));

            tsdbDebug("vgId:%d, %s qid:%s uid:%" PRId64 " from memtable(hash), col_id:%d col_flag:%d ts:%" PRId64,
                      TD_VID(pTsdb->pVnode), __func__, pr && pr->idstr ? pr->idstr : "null", uid, lastCol.colVal.cid,
                      lastCol.colVal.flag, tsdbRowKey.key.ts);

            tsdbCacheFreeSLastColItem(pTargetCol);
            taosArraySet(pLastArray, *pjCol, &lastCol);
          }

          // The column is settled once a row with a value has been seen, replaced or not.
          TAOS_CHECK_EXIT(tSimpleHashRemove(iColHash, &pColVal->cid, sizeof(pColVal->cid)));
        }
      }
      tsdbRowClose(&rowIter);

      pRow = memRowIterGet(&iter, false, NULL, 0);
    }
  }

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));

    tsdbRowClose(&rowIter);
  }

  tSimpleHashCleanup(iColHash);

  memRowIterClose(&iter);

  TAOS_RETURN(code);
}
2685

2686
/*
 * Fill pLastArray with the last/last_row values of table `uid`.
 *
 * The values are first collected through tsdbCacheGetBatchFromLru; when tsUpdateCacheBatch is
 * set they are then overlaid with memtable data via tsdbCacheGetBatchFromMem. The temporary
 * key array shared by both steps is released before returning.
 */
int32_t tsdbCacheGetBatch(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SCacheRowsReader *pr, int8_t ltype) {
  int32_t code = 0;
  int32_t lino = 0;
  SArray *keyArray = NULL;

  tsdbDebug("vgId:%d, %s start, qid:%s uid:%" PRId64 " ltype:%d", TD_VID(pTsdb->pVnode), __func__,
            pr && pr->idstr ? pr->idstr : "null", uid, ltype);

  keyArray = taosArrayInit(16, sizeof(SLastKey));
  if (keyArray == NULL) {
    TAOS_CHECK_EXIT(terrno);
  }

  TAOS_CHECK_EXIT(tsdbCacheGetBatchFromLru(pTsdb, uid, pLastArray, pr, ltype, keyArray));

  if (!tsUpdateCacheBatch) {
    goto _exit;
  }
  TAOS_CHECK_EXIT(tsdbCacheGetBatchFromMem(pTsdb, uid, pLastArray, pr, keyArray));

_exit:
  if (code != 0) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));
  }

  if (keyArray != NULL) {
    taosArrayDestroy(keyArray);
  }

  TAOS_RETURN(code);
}
2715

2716
/*
 * Invalidate cached last/last_row entries of table `uid` whose timestamp lies in [sKey, eKey].
 *
 * For every column of the table's schema and every flag from LFLAG_LAST_ROW to LFLAG_LAST:
 *  - an entry found in the LRU cache with a timestamp in range is replaced by a dirty NONE
 *    column marked TSDB_LAST_CACHE_NO_CACHE;
 *  - an entry not found in the LRU cache is looked up in rocksdb, and when its timestamp is in
 *    range a NONE / NO_CACHE column is written to both rocksdb and the LRU cache.
 *
 * The LRU mutex is held from the first lookup until _exit. Returns 0 or the first error code.
 */
int32_t tsdbCacheDel(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, TSKEY sKey, TSKEY eKey) {
  int32_t   code = 0, lino = 0;
  STSchema *pTSchema = NULL;
  int       sver = -1;
  int       numKeys = 0;
  SArray   *remainCols = NULL;
  // Declared (and NULL-initialized) before the first `goto _exit`: the cleanup code frees all of
  // them, so they must never be reached with indeterminate values.
  char    **keys_list = NULL;
  size_t   *keys_list_sizes = NULL;
  char    **values_list = NULL;
  size_t   *values_list_sizes = NULL;

  TAOS_CHECK_RETURN(metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, sver, &pTSchema));

  int numCols = pTSchema->numOfCols;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  for (int i = 0; i < numCols; ++i) {
    int16_t cid = pTSchema->columns[i].colId;
    for (int8_t lflag = LFLAG_LAST_ROW; lflag <= LFLAG_LAST; ++lflag) {
      SLastKey   lastKey = {.lflag = lflag, .uid = uid, .cid = cid};
      LRUHandle *h = taosLRUCacheLookup(pTsdb->lruCache, &lastKey, ROCKS_KEY_LEN);
      if (h) {
        SLastCol *pLastCol = (SLastCol *)taosLRUCacheValue(pTsdb->lruCache, h);
        if (pLastCol->rowKey.ts <= eKey && pLastCol->rowKey.ts >= sKey) {
          SLastCol noneCol = {.rowKey.ts = TSKEY_MIN,
                              .colVal = COL_VAL_NONE(cid, pTSchema->columns[i].type),
                              .dirty = 1,
                              .cacheStatus = TSDB_LAST_CACHE_NO_CACHE};
          code = tsdbCachePutToLRU(pTsdb, &lastKey, &noneCol, 1);
        }
        // Release the handle before acting on the put result so it is not leaked on failure.
        tsdbLRUCacheRelease(pTsdb->lruCache, h, false);
        TAOS_CHECK_EXIT(code);
      } else {
        if (!remainCols) {
          remainCols = taosArrayInit(numCols * 2, sizeof(SIdxKey));
          if (!remainCols) {
            TAOS_CHECK_EXIT(terrno);
          }
        }
        if (!taosArrayPush(remainCols, &(SIdxKey){i, lastKey})) {
          TAOS_CHECK_EXIT(terrno);
        }
      }
    }
  }

  if (remainCols) {
    numKeys = TARRAY_SIZE(remainCols);
  }

  keys_list = taosMemoryCalloc(numKeys, sizeof(char *));
  keys_list_sizes = taosMemoryCalloc(numKeys, sizeof(size_t));

  if (!keys_list || !keys_list_sizes) {
    code = terrno;
    goto _exit;
  }
  const size_t klen = ROCKS_KEY_LEN;

  for (int i = 0; i < numKeys; ++i) {
    char *key = taosMemoryCalloc(1, sizeof(SLastKey));
    if (!key) {
      code = terrno;
      goto _exit;
    }
    SIdxKey *idxKey = taosArrayGet(remainCols, i);

    ((SLastKey *)key)[0] = idxKey->key;

    keys_list[i] = key;
    keys_list_sizes[i] = klen;
  }

  rocksMayWrite(pTsdb, true);  // flush writebatch cache

  TAOS_CHECK_GOTO(tsdbCacheGetValuesFromRocks(pTsdb, numKeys, (const char *const *)keys_list, keys_list_sizes,
                                              &values_list, &values_list_sizes),
                  NULL, _exit);

  for (int i = 0; i < numKeys; ++i) {
    SLastCol *pLastCol = NULL;
    if (values_list[i] != NULL) {
      code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
        goto _exit;
      }
    }
    SIdxKey  *idxKey = taosArrayGet(remainCols, i);
    SLastKey *pLastKey = &idxKey->key;
    if (NULL != pLastCol && (pLastCol->rowKey.ts <= eKey && pLastCol->rowKey.ts >= sKey)) {
      SLastCol noCacheCol = {.rowKey.ts = TSKEY_MIN,
                             .colVal = COL_VAL_NONE(pLastKey->cid, pTSchema->columns[idxKey->idx].type),
                             .dirty = 0,
                             .cacheStatus = TSDB_LAST_CACHE_NO_CACHE};

      if ((code = tsdbCachePutToRocksdb(pTsdb, pLastKey, &noCacheCol)) != TSDB_CODE_SUCCESS) {
        taosMemoryFreeClear(pLastCol);
        tsdbError("tsdb/cache/del: vgId:%d, put to rocks failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
        goto _exit;
      }
      if ((code = tsdbCachePutToLRU(pTsdb, pLastKey, &noCacheCol, 0)) != TSDB_CODE_SUCCESS) {
        taosMemoryFreeClear(pLastCol);
        tsdbError("tsdb/cache/del: vgId:%d, put to lru failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
        goto _exit;
      }
    }

    if (pLastCol == NULL) {
      tsdbDebug("tsdb/cache/del: vgId:%d, no cache found for uid:%" PRId64 ", cid:%d, lflag:%d.",
                TD_VID(pTsdb->pVnode), pLastKey->uid, pLastKey->cid, pLastKey->lflag);
    }

    taosMemoryFreeClear(pLastCol);
  }

  rocksMayWrite(pTsdb, false);

_exit:
  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  // keys_list is NULL when its allocation failed or was never reached.
  if (keys_list) {
    for (int i = 0; i < numKeys; ++i) {
      taosMemoryFree(keys_list[i]);
    }
  }
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  if (values_list) {
#if USE_ROCKSDB
    for (int i = 0; i < numKeys; ++i) {
      rocksdb_free(values_list[i]);
    }
#endif
    taosMemoryFree(values_list);
  }
  taosMemoryFree(values_list_sizes);
  taosArrayDestroy(remainCols);
  taosMemoryFree(pTSchema);

  TAOS_RETURN(code);
}
2854

2855
/*
 * Create the caches attached to a tsdb instance.
 *
 * Builds the last-value LRU cache (capacity = config.cacheLastSize * 1024 * 1024), opens the
 * block/page caches when shared storage is compiled in and enabled, opens the rocksdb cache,
 * and initializes the LRU mutex. On failure the LRU cache is destroyed and pTsdb->lruCache is
 * left NULL.
 */
int32_t tsdbOpenCache(STsdb *pTsdb) {
  int32_t    code = 0, lino = 0;
  size_t     capacityBytes = (size_t)pTsdb->pVnode->config.cacheLastSize * 1024 * 1024;
  SLRUCache *pLru = taosLRUCacheInit(capacityBytes, 0, .5);

  if (pLru == NULL) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

#ifdef USE_SHARED_STORAGE
  if (tsSsEnabled) {
    TAOS_CHECK_GOTO(tsdbOpenBCache(pTsdb), &lino, _err);
    TAOS_CHECK_GOTO(tsdbOpenPgCache(pTsdb), &lino, _err);
  }
#endif

  TAOS_CHECK_GOTO(tsdbOpenRocksCache(pTsdb), &lino, _err);

  taosLRUCacheSetStrictCapacity(pLru, false);
  (void)taosThreadMutexInit(&pTsdb->lruMutex, NULL);
  pTsdb->lruCache = pLru;

  TAOS_RETURN(0);

_err:
  if (code != 0) {
    tsdbError("tsdb/cache: vgId:%d, open failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));
    if (pLru != NULL) {
      taosLRUCacheCleanup(pLru);
      pLru = NULL;
    }
  }
  pTsdb->lruCache = pLru;
  TAOS_RETURN(code);
}
2892

2893
/*
 * Tear down the caches of a tsdb instance: the LRU cache and its mutex (only when the LRU cache
 * exists), the shared-storage block/page caches when enabled, and the rocksdb cache.
 */
void tsdbCloseCache(STsdb *pTsdb) {
  SLRUCache *pLru = pTsdb->lruCache;

  if (pLru != NULL) {
    taosLRUCacheEraseUnrefEntries(pLru);
    taosLRUCacheCleanup(pLru);
    (void)taosThreadMutexDestroy(&pTsdb->lruMutex);
  }

#ifdef USE_SHARED_STORAGE
  if (tsSsEnabled) {
    tsdbCloseBCache(pTsdb);
    tsdbClosePgCache(pTsdb);
  }
#endif

  tsdbCloseRocksCache(pTsdb);
}
40✔
2912

2913
/*
 * Build the 8-byte cache key of a table.
 *
 * The key is the table uid as a uint64_t in host byte order; for any cacheType other than 0
 * (last_row) the top bit is set to mark the "last" variant.
 *
 * @param uid        table uid
 * @param cacheType  0 for last_row, anything else for last
 * @param key        output buffer, at least sizeof(uint64_t) bytes; no alignment required
 * @param len        receives the key length (sizeof(uint64_t))
 */
static void getTableCacheKey(tb_uid_t uid, int cacheType, char *key, int *len) {
  uint64_t rawKey = (uint64_t)uid;

  if (cacheType != 0) {  // last
    rawKey |= 0x8000000000000000ULL;
  }

  // memcpy instead of a store through a cast pointer: `key` is a char buffer that need not be
  // suitably aligned (or typed) for a uint64_t access.
  memcpy(key, &rawKey, sizeof(rawKey));

  *len = (int)sizeof(uint64_t);
}
×
2922

2923
/*
 * Look up the super-table uid of table `uid`.
 *
 * Returns ctbEntry.suid when the table entry is a child table; returns 0 when the entry cannot
 * be read (table does not exist) or the table is of any other type.
 */
static tb_uid_t getTableSuidByUid(tb_uid_t uid, STsdb *pTsdb) {
  SMetaReader reader = {0};
  tb_uid_t    result = 0;

  metaReaderDoInit(&reader, pTsdb->pVnode->pMeta, META_READER_LOCK);

  if (metaReaderGetTableEntryByUidCache(&reader, uid) >= 0 && reader.me.type == TSDB_CHILD_TABLE) {
    result = reader.me.ctbEntry.suid;
  }

  metaReaderClear(&reader);

  return result;
}
2945

2946
/*
 * Read the delete records referenced by pDelIdx into aDelData.
 * A NULL pDelIdx is not an error: nothing is read and 0 is returned.
 */
static int32_t getTableDelDataFromDelIdx(SDelFReader *pDelReader, SDelIdx *pDelIdx, SArray *aDelData) {
  int32_t code = (pDelIdx != NULL) ? tsdbReadDelDatav1(pDelReader, pDelIdx, aDelData, INT64_MAX) : 0;

  TAOS_RETURN(code);
}
2955

2956
/*
 * Append every delete record of a memtable table (the list starting at pTbData->pHead) to
 * aDelData. A NULL pTbData contributes nothing. Returns terrno when a push fails, 0 otherwise.
 */
static int32_t getTableDelDataFromTbData(STbData *pTbData, SArray *aDelData) {
  int32_t   code = 0;
  SDelData *pNode = NULL;

  if (pTbData != NULL) {
    pNode = pTbData->pHead;
  }

  while (pNode != NULL) {
    if (taosArrayPush(aDelData, pNode) == NULL) {
      TAOS_RETURN(terrno);
    }
    pNode = pNode->pNext;
  }

  TAOS_RETURN(code);
}
2968

2969
/*
 * Return the reader's sorted uid list, building it on first use.
 *
 * The list is copied from pReader->pTableList, sorted with uidComparFunc and stored in
 * pReader->uidList. Returns NULL when the allocation fails.
 */
static uint64_t *getUidList(SCacheRowsReader *pReader) {
  if (pReader->uidList != NULL) {
    return pReader->uidList;
  }

  int32_t   nTables = pReader->numOfTables;
  uint64_t *pList = taosMemoryMalloc(nTables * sizeof(uint64_t));

  pReader->uidList = pList;
  if (pList == NULL) {
    return NULL;
  }

  for (int32_t idx = 0; idx < nTables; ++idx) {
    pList[idx] = pReader->pTableList[idx].uid;
  }

  taosSort(pList, nTables, sizeof(uint64_t), uidComparFunc);

  return pReader->uidList;
}
2988

2989
/*
 * Load tombstone (delete) records for the reader's tables from a tomb block array.
 *
 * Tomb blocks whose [minTbid, maxTbid] range cannot contain any of the reader's tables are
 * skipped. Each remaining block is read (from a data file when isFile is true, otherwise from
 * an stt file) and its records are walked together with the sorted uid list: records that match
 * a table and whose version does not exceed pReader->info.verRange.maxVer are appended to that
 * table's pTombData array.
 *
 * The tomb block is destroyed on every path once it has been read. Returns 0 on success or the
 * first error code.
 */
static int32_t loadTombFromBlk(const TTombBlkArray *pTombBlkArray, SCacheRowsReader *pReader, void *pFileReader,
                               bool isFile) {
  int32_t   code = 0;
  int32_t   numOfTables = pReader->numOfTables;
  int64_t   suid = pReader->info.suid;
  uint64_t *uidList = getUidList(pReader);

  if (!uidList) {
    TAOS_RETURN(terrno);
  }

  for (int i = 0, j = 0; i < pTombBlkArray->size && j < numOfTables; ++i) {
    STombBlk *pTombBlk = &pTombBlkArray->data[i];
    // Block ends before the first table of interest: try the next block.
    if (pTombBlk->maxTbid.suid < suid || (pTombBlk->maxTbid.suid == suid && pTombBlk->maxTbid.uid < uidList[0])) {
      continue;
    }

    // Block starts after the last table of interest: nothing further can match.
    if (pTombBlk->minTbid.suid > suid ||
        (pTombBlk->minTbid.suid == suid && pTombBlk->minTbid.uid > uidList[numOfTables - 1])) {
      break;
    }

    STombBlock block = {0};
    code = isFile ? tsdbDataFileReadTombBlock(pFileReader, &pTombBlkArray->data[i], &block)
                  : tsdbSttFileReadTombBlock(pFileReader, &pTombBlkArray->data[i], &block);
    if (code != TSDB_CODE_SUCCESS) {
      TAOS_RETURN(code);
    }

    uint64_t        uid = uidList[j];
    STableLoadInfo *pInfo = getTableLoadInfo(pReader, uid);
    if (!pInfo) {
      tTombBlockDestroy(&block);
      TAOS_RETURN(TSDB_CODE_OUT_OF_MEMORY);
    }

    if (pInfo->pTombData == NULL) {
      pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
      if (!pInfo->pTombData) {
        code = terrno;
        tTombBlockDestroy(&block);
        TAOS_RETURN(code);
      }
    }

    STombRecord record = {0};
    bool        finished = false;  // set when the whole load must stop after this block
    for (int32_t k = 0; k < TOMB_BLOCK_SIZE(&block); ++k) {
      code = tTombBlockGet(&block, k, &record);
      if (code != TSDB_CODE_SUCCESS) {
        finished = true;
        break;
      }

      if (record.suid < suid) {
        continue;
      }
      if (record.suid > suid) {
        finished = true;
        break;
      }

      // Advance the table cursor until it reaches (or passes) the record's table.
      bool newTable = false;
      if (uid < record.uid) {
        while (j < numOfTables && uidList[j] < record.uid) {
          ++j;
          newTable = true;
        }

        if (j >= numOfTables) {
          finished = true;
          break;
        }

        uid = uidList[j];
      }

      if (record.uid < uid) {
        continue;
      }

      if (newTable) {
        pInfo = getTableLoadInfo(pReader, uid);
        if (!pInfo) {
          code = TSDB_CODE_OUT_OF_MEMORY;
          finished = true;
          break;
        }
        if (pInfo->pTombData == NULL) {
          pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
          if (!pInfo->pTombData) {
            code = terrno;
            finished = true;
            break;
          }
        }
      }

      if (record.version <= pReader->info.verRange.maxVer) {
        SDelData delData = {.version = record.version, .sKey = record.skey, .eKey = record.ekey};
        if (!taosArrayPush(pInfo->pTombData, &delData)) {
          // Leave through the common path so the tomb block is destroyed.
          code = terrno;
          finished = true;
          break;
        }
      }
    }

    tTombBlockDestroy(&block);

    if (finished) {
      TAOS_RETURN(code);
    }
  }

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
3102

3103
/*
 * Load tombstone records from a data file: fetch its tomb block index, then hand it to
 * loadTombFromBlk in data-file mode.
 */
static int32_t loadDataTomb(SCacheRowsReader *pReader, SDataFileReader *pFileReader) {
  const TTombBlkArray *pTombBlks = NULL;

  int32_t code = tsdbDataFileReadTombBlk(pFileReader, &pTombBlks);
  if (code != TSDB_CODE_SUCCESS) {
    TAOS_RETURN(code);
  }

  code = loadTombFromBlk(pTombBlks, pReader, pFileReader, true);
  TAOS_RETURN(code);
}
3110

3111
/*
 * Load tombstone records from an stt file: fetch its tomb block index, then hand it to
 * loadTombFromBlk in stt-file mode. pTsdbReader is used as a SCacheRowsReader; pLoadInfo is
 * not used here.
 */
static int32_t loadSttTomb(STsdbReader *pTsdbReader, SSttFileReader *pSttFileReader, SSttBlockLoadInfo *pLoadInfo) {
  const TTombBlkArray *pTombBlks = NULL;
  SCacheRowsReader    *pCacheReader = (SCacheRowsReader *)pTsdbReader;

  int32_t code = tsdbSttFileReadTombBlk(pSttFileReader, &pTombBlks);
  if (code != TSDB_CODE_SUCCESS) {
    TAOS_RETURN(code);
  }

  code = loadTombFromBlk(pTombBlks, pCacheReader, pSttFileReader, false);
  TAOS_RETURN(code);
}
3119

3120
typedef struct {
3121
  SMergeTree  mergeTree;
3122
  SMergeTree *pMergeTree;
3123
} SFSLastIter;
3124

3125
/*
 * Open a backward merge-tree iterator over the stt files of pFileSet for table (suid, uid),
 * covering timestamps from lastTs up to TSKEY_MAX and all versions.
 *
 * The reader's stt block iterator array is destroyed and recreated first. On success
 * iter->pMergeTree points at the opened tree.
 */
static int32_t lastIterOpen(SFSLastIter *iter, STFileSet *pFileSet, STsdb *pTsdb, STSchema *pTSchema, tb_uid_t suid,
                            tb_uid_t uid, SCacheRowsReader *pr, int64_t lastTs, int16_t *aCols, int nCols) {
  int32_t code = 0;

  destroySttBlockReader(pr->pLDataIterArray, NULL);
  pr->pLDataIterArray = taosArrayInit(4, POINTER_BYTES);
  if (pr->pLDataIterArray == NULL) {
    return terrno;
  }

  SMergeTreeConf conf = {0};
  conf.uid = uid;
  conf.suid = suid;
  conf.pTsdb = pTsdb;
  conf.timewindow.skey = lastTs;
  conf.timewindow.ekey = TSKEY_MAX;
  conf.verRange.minVer = 0;
  conf.verRange.maxVer = INT64_MAX;
  conf.strictTimeRange = false;
  conf.cacheStatis = false;
  conf.pSchema = pTSchema;
  conf.pCurrentFileset = pFileSet;
  conf.backward = 1;
  conf.pSttFileBlockIterArray = pr->pLDataIterArray;
  conf.pCols = aCols;
  conf.numOfCols = nCols;
  conf.loadTombFn = loadSttTomb;
  conf.pReader = pr;
  conf.idstr = pr->idstr;
  conf.pCurRowKey = &pr->rowKey;

  TAOS_CHECK_RETURN(tMergeTreeOpen2(&iter->mergeTree, &conf, NULL));

  iter->pMergeTree = &iter->mergeTree;

  TAOS_RETURN(code);
}
3158

3159
/*
 * Close the merge tree of *iter (when one is open) and reset the caller's pointer to NULL.
 * Always returns 0.
 */
static int32_t lastIterClose(SFSLastIter **iter) {
  int32_t      code = 0;
  SFSLastIter *pIter = *iter;

  if (pIter->pMergeTree != NULL) {
    tMergeTreeClose(pIter->pMergeTree);
    pIter->pMergeTree = NULL;
  }

  *iter = NULL;

  TAOS_RETURN(code);
}
3171

3172
/*
 * Advance the merge tree and report its current row.
 *
 * *ppRow is set to the row when the tree has one, and to NULL when it is exhausted or when
 * advancing fails (the error code is then returned).
 */
static int32_t lastIterNext(SFSLastIter *iter, TSDBROW **ppRow) {
  bool    hasRow = false;
  int32_t code = 0;

  *ppRow = NULL;

  code = tMergeTreeNext(iter->pMergeTree, &hasRow);
  if (code != 0) {
    return code;
  }

  if (hasRow) {
    *ppRow = tMergeTreeGetRow(iter->pMergeTree);
  }

  TAOS_RETURN(code);
}
3189

3190
// Steps of the state machine driven by getNextRowFromFS; values are implicit and start at 0.
typedef enum SFSNEXTROWSTATES {
  SFSNEXTROW_FS,          // initial step: position on the file set array
  SFSNEXTROW_FILESET,     // select the next file set
  SFSNEXTROW_INDEXLIST,
  SFSNEXTROW_BRINBLOCK,
  SFSNEXTROW_BRINRECORD,
  SFSNEXTROW_BLOCKDATA,
  SFSNEXTROW_BLOCKROW,
  SFSNEXTROW_NEXTSTTROW
} SFSNEXTROWSTATES;
3200

3201
// Forward declaration: SFSNextRowIter refers to a CacheNextRowIter through its pRowIter member.
struct CacheNextRowIter;
3202

3203
typedef struct SFSNextRowIter {
3204
  SFSNEXTROWSTATES         state;         // [input]
3205
  SBlockIdx               *pBlockIdxExp;  // [input]
3206
  STSchema                *pTSchema;      // [input]
3207
  tb_uid_t                 suid;
3208
  tb_uid_t                 uid;
3209
  int32_t                  iFileSet;
3210
  STFileSet               *pFileSet;
3211
  TFileSetArray           *aDFileSet;
3212
  SArray                  *pIndexList;
3213
  int32_t                  iBrinIndex;
3214
  SBrinBlock               brinBlock;
3215
  SBrinBlock              *pBrinBlock;
3216
  int32_t                  iBrinRecord;
3217
  SBrinRecord              brinRecord;
3218
  SBlockData               blockData;
3219
  SBlockData              *pBlockData;
3220
  int32_t                  nRow;
3221
  int32_t                  iRow;
3222
  TSDBROW                  row;
3223
  int64_t                  lastTs;
3224
  SFSLastIter              lastIter;
3225
  SFSLastIter             *pLastIter;
3226
  int8_t                   lastEmpty;
3227
  TSDBROW                 *pLastRow;
3228
  SRow                    *pTSRow;
3229
  SRowMerger               rowMerger;
3230
  SCacheRowsReader        *pr;
3231
  struct CacheNextRowIter *pRowIter;
3232
} SFSNextRowIter;
3233

3234
// Forward declaration; getNextRowFromFS calls this each time it moves on to another file set.
static void clearLastFileSet(SFSNextRowIter *state);
3235

3236
/*
 * Return the next row of the table (state->suid, state->uid) stored in data
 * files. File sets are visited from the last to the first; inside a data block
 * rows are visited from the last to the first. Rows from the stt (last)
 * iterator of the same file set are interleaved by timestamp, and rows with
 * equal timestamps are merged.
 *
 * The function is resumable: state->state records where the previous call
 * stopped.
 *
 * @param iter             SFSNextRowIter to advance.
 * @param ppRow            receives the next row, or NULL when no file set is left
 *                         or on the error paths that go through _err.
 * @param pIgnoreEarlierTs not used by this function.
 * @param isLast           not used by this function.
 * @param aCols            column ids to load; a leading primary-key timestamp
 *                         column id is skipped before reading block data.
 * @param nCols            number of entries in aCols.
 * @return 0 on success, otherwise the error code of the failing step.
 */
static int32_t getNextRowFromFS(void *iter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast, int16_t *aCols,
                                int nCols) {
  int32_t         code = 0, lino = 0;
  SFSNextRowIter *state = (SFSNextRowIter *)iter;
  STsdb          *pTsdb = state->pr->pTsdb;

  if (SFSNEXTROW_FS == state->state) {
    // start one past the last file set; _next_fileset pre-decrements
    state->iFileSet = TARRAY2_SIZE(state->aDFileSet);

    state->state = SFSNEXTROW_FILESET;
  }

  if (SFSNEXTROW_FILESET == state->state) {
  _next_fileset:
    clearLastFileSet(state);

    if (--state->iFileSet < 0) {
      // no file set left
      *ppRow = NULL;

      TAOS_RETURN(code);
    } else {
      state->pFileSet = TARRAY2_GET(state->aDFileSet, state->iFileSet);
    }

    STFileObj **pFileObj = state->pFileSet->farr;
    if (pFileObj[0] != NULL || pFileObj[3] != NULL) {
      if (state->pFileSet != state->pr->pCurFileSet) {
        SDataFileReaderConfig conf = {.tsdb = pTsdb, .szPage = pTsdb->pVnode->config.tsdbPageSize};
        const char           *filesName[4] = {0};
        if (pFileObj[0] != NULL) {
          // slots 1 and 2 are dereferenced whenever slot 0 is present
          conf.files[0].file = *pFileObj[0]->f;
          conf.files[0].exist = true;
          filesName[0] = pFileObj[0]->fname;

          conf.files[1].file = *pFileObj[1]->f;
          conf.files[1].exist = true;
          filesName[1] = pFileObj[1]->fname;

          conf.files[2].file = *pFileObj[2]->f;
          conf.files[2].exist = true;
          filesName[2] = pFileObj[2]->fname;
        }

        if (pFileObj[3] != NULL) {
          conf.files[3].exist = true;
          conf.files[3].file = *pFileObj[3]->f;
          filesName[3] = pFileObj[3]->fname;
        }

        TAOS_CHECK_GOTO(tsdbDataFileReaderOpen(filesName, &conf, &state->pr->pFileReader), &lino, _err);

        state->pr->pCurFileSet = state->pFileSet;

        code = loadDataTomb(state->pr, state->pr->pFileReader);
        if (code != TSDB_CODE_SUCCESS) {
          tsdbError("vgId:%d, %s load tomb failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                    tstrerror(code));
          TAOS_CHECK_GOTO(code, &lino, _err);
        }

        TAOS_CHECK_GOTO(tsdbDataFileReadBrinBlk(state->pr->pFileReader, &state->pr->pBlkArray), &lino, _err);
      }

      if (!state->pIndexList) {
        state->pIndexList = taosArrayInit(1, sizeof(SBrinBlk));
        if (!state->pIndexList) {
          TAOS_CHECK_GOTO(terrno, &lino, _err);
        }
      } else {
        taosArrayClear(state->pIndexList);
      }

      const TBrinBlkArray *pBlkArray = state->pr->pBlkArray;

      // collect, from the last brin block backwards, those whose id range covers this table
      for (int i = TARRAY2_SIZE(pBlkArray) - 1; i >= 0; --i) {
        SBrinBlk *pBrinBlk = &pBlkArray->data[i];
        if (state->suid >= pBrinBlk->minTbid.suid && state->suid <= pBrinBlk->maxTbid.suid) {
          if (state->uid >= pBrinBlk->minTbid.uid && state->uid <= pBrinBlk->maxTbid.uid) {
            if (!taosArrayPush(state->pIndexList, pBrinBlk)) {
              TAOS_CHECK_GOTO(terrno, &lino, _err);
            }
          }
        } else if (state->suid > pBrinBlk->maxTbid.suid ||
                   (state->suid == pBrinBlk->maxTbid.suid && state->uid > pBrinBlk->maxTbid.uid)) {
          // this block ends before the table; stop scanning
          break;
        }
      }

      int indexSize = TARRAY_SIZE(state->pIndexList);
      if (indexSize <= 0) {
        goto _check_stt_data;
      }

      state->state = SFSNEXTROW_INDEXLIST;
      // NOTE(review): the cursor starts at 1, so only entry 0 of pIndexList is visited - confirm this is intended
      state->iBrinIndex = 1;
    }

  _check_stt_data:
    if (state->pFileSet != state->pr->pCurFileSet) {
      state->pr->pCurFileSet = state->pFileSet;
    }

    TAOS_CHECK_GOTO(lastIterOpen(&state->lastIter, state->pFileSet, pTsdb, state->pTSchema, state->suid, state->uid,
                                 state->pr, state->lastTs, aCols, nCols),
                    &lino, _err);

    TAOS_CHECK_GOTO(lastIterNext(&state->lastIter, &state->pLastRow), &lino, _err);

    if (!state->pLastRow) {
      state->lastEmpty = 1;

      if (SFSNEXTROW_INDEXLIST != state->state) {
        // neither block data nor stt data in this file set
        clearLastFileSet(state);
        goto _next_fileset;
      }
    } else {
      state->lastEmpty = 0;

      if (SFSNEXTROW_INDEXLIST != state->state) {
        // only stt data in this file set: hand out stt rows directly
        state->state = SFSNEXTROW_NEXTSTTROW;

        *ppRow = state->pLastRow;
        state->pLastRow = NULL;

        TAOS_RETURN(code);
      }
    }

    state->pLastIter = &state->lastIter;
  }

  if (SFSNEXTROW_NEXTSTTROW == state->state) {
    TAOS_CHECK_GOTO(lastIterNext(&state->lastIter, &state->pLastRow), &lino, _err);

    if (!state->pLastRow) {
      if (state->pLastIter) {
        code = lastIterClose(&state->pLastIter);
        if (code != TSDB_CODE_SUCCESS) {
          tsdbError("vgId:%d, %s close last iter failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                    tstrerror(code));
          TAOS_RETURN(code);
        }
      }

      clearLastFileSet(state);
      state->state = SFSNEXTROW_FILESET;
      goto _next_fileset;
    } else {
      *ppRow = state->pLastRow;
      state->pLastRow = NULL;

      TAOS_RETURN(code);
    }
  }

  if (SFSNEXTROW_INDEXLIST == state->state) {
    SBrinBlk *pBrinBlk = NULL;
  _next_brinindex:
    if (--state->iBrinIndex < 0) {
      if (state->pLastRow) {
        // block data exhausted but an stt row is pending: switch to stt-only output
        state->state = SFSNEXTROW_NEXTSTTROW;
        *ppRow = state->pLastRow;
        state->pLastRow = NULL;
        return code;
      }

      clearLastFileSet(state);
      goto _next_fileset;
    } else {
      pBrinBlk = taosArrayGet(state->pIndexList, state->iBrinIndex);
    }

    if (!state->pBrinBlock) {
      state->pBrinBlock = &state->brinBlock;
    } else {
      tBrinBlockClear(&state->brinBlock);
    }

    TAOS_CHECK_GOTO(tsdbDataFileReadBrinBlock(state->pr->pFileReader, pBrinBlk, &state->brinBlock), &lino, _err);

    state->iBrinRecord = state->brinBlock.numOfRecords - 1;
    state->state = SFSNEXTROW_BRINBLOCK;
  }

  if (SFSNEXTROW_BRINBLOCK == state->state) {
  _next_brinrecord:
    if (state->iBrinRecord < 0) {  // empty brin block, goto _next_brinindex
      tBrinBlockClear(&state->brinBlock);
      goto _next_brinindex;
    }

    TAOS_CHECK_GOTO(tBrinBlockGet(&state->brinBlock, state->iBrinRecord, &state->brinRecord), &lino, _err);

    SBrinRecord *pRecord = &state->brinRecord;
    if (pRecord->uid != state->uid) {
      // TODO: goto next brin block early
      --state->iBrinRecord;
      goto _next_brinrecord;
    }

    state->state = SFSNEXTROW_BRINRECORD;
  }

  if (SFSNEXTROW_BRINRECORD == state->state) {
    SBrinRecord *pRecord = &state->brinRecord;

    if (!state->pBlockData) {
      state->pBlockData = &state->blockData;

      TAOS_CHECK_GOTO(tBlockDataCreate(&state->blockData), &lino, _err);
    } else {
      tBlockDataReset(state->pBlockData);
    }

    // skip a leading timestamp column id; only look at aCols[0] when the list is not empty
    if (nCols > 0 && aCols[0] == PRIMARYKEY_TIMESTAMP_COL_ID) {
      --nCols;
      ++aCols;
    }

    TAOS_CHECK_GOTO(tsdbDataFileReadBlockDataByColumn(state->pr->pFileReader, pRecord, state->pBlockData,
                                                      state->pTSchema, aCols, nCols),
                    &lino, _err);

    state->nRow = state->blockData.nRow;
    state->iRow = state->nRow - 1;

    state->state = SFSNEXTROW_BLOCKROW;
  }

  if (SFSNEXTROW_BLOCKROW == state->state) {
    if (state->iRow < 0) {
      // data block exhausted: continue with the previous brin record
      --state->iBrinRecord;
      goto _next_brinrecord;
    }

    state->row = tsdbRowFromBlockData(state->pBlockData, state->iRow);
    if (!state->pLastIter) {
      // stt iterator already closed: block rows only
      *ppRow = &state->row;
      --state->iRow;
      return code;
    }

    if (!state->pLastRow) {
      // get next row from fslast and process with fs row, --state->Row if select fs row
      TAOS_CHECK_GOTO(lastIterNext(&state->lastIter, &state->pLastRow), &lino, _err);
    }

    if (!state->pLastRow) {
      if (state->pLastIter) {
        code = lastIterClose(&state->pLastIter);
        if (code != TSDB_CODE_SUCCESS) {
          tsdbError("vgId:%d, %s close last iter failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                    tstrerror(code));
          TAOS_RETURN(code);
        }
      }

      *ppRow = &state->row;
      --state->iRow;
      return code;
    }

    // process state->pLastRow & state->row
    TSKEY rowTs = TSDBROW_TS(&state->row);
    TSKEY lastRowTs = TSDBROW_TS(state->pLastRow);
    if (lastRowTs > rowTs) {
      // stt row is newer: return it and keep the block row for the next call
      *ppRow = state->pLastRow;
      state->pLastRow = NULL;

      TAOS_RETURN(code);
    } else if (lastRowTs < rowTs) {
      // block row is newer: return it and keep the stt row pending
      *ppRow = &state->row;
      --state->iRow;

      TAOS_RETURN(code);
    } else {
      // equal timestamps: merge the block row and the stt row into state->pTSRow
      SRowMerger *pMerger = &state->rowMerger;
      code = tsdbRowMergerInit(pMerger, state->pTSchema);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbError("vgId:%d, %s init row merger failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
        TAOS_RETURN(code);
      }

      TAOS_CHECK_GOTO(tsdbRowMergerAdd(pMerger, &state->row, state->pTSchema), &lino, _err);
      TAOS_CHECK_GOTO(tsdbRowMergerAdd(pMerger, state->pLastRow, state->pTSchema), &lino, _err);

      if (state->pTSRow) {
        taosMemoryFree(state->pTSRow);
        state->pTSRow = NULL;
      }

      TAOS_CHECK_GOTO(tsdbRowMergerGetRow(pMerger, &state->pTSRow), &lino, _err);

      state->row = tsdbRowFromTSRow(TSDBROW_VERSION(&state->row), state->pTSRow);
      *ppRow = &state->row;
      --state->iRow;

      tsdbRowMergerClear(pMerger);

      TAOS_RETURN(code);
    }
  }

_err:
  clearLastFileSet(state);

  *ppRow = NULL;

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
3553

3554
typedef struct CacheNextRowIter {
3555
  SArray           *pMemDelData;
3556
  SArray           *pSkyline;
3557
  int64_t           iSkyline;
3558
  SBlockIdx         idx;
3559
  SMemNextRowIter   memState;
3560
  SMemNextRowIter   imemState;
3561
  SFSNextRowIter    fsState;
3562
  TSDBROW           memRow, imemRow, fsLastRow, fsRow;
3563
  TsdbNextRowState  input[3];
3564
  SCacheRowsReader *pr;
3565
  STsdb            *pTsdb;
3566
} CacheNextRowIter;
3567

3568
int32_t clearNextRowFromFS(void *iter) {
×
3569
  int32_t code = 0;
×
3570

3571
  SFSNextRowIter *state = (SFSNextRowIter *)iter;
×
3572
  if (!state) {
×
3573
    TAOS_RETURN(code);
×
3574
  }
3575

3576
  if (state->pLastIter) {
×
3577
    code = lastIterClose(&state->pLastIter);
×
3578
    if (code != TSDB_CODE_SUCCESS) {
×
3579
      tsdbError("%s close last iter failed at line %d since %s", __func__, __LINE__, tstrerror(code));
×
3580
      TAOS_RETURN(code);
×
3581
    }
3582
  }
3583

3584
  if (state->pBlockData) {
×
3585
    tBlockDataDestroy(state->pBlockData);
×
3586
    state->pBlockData = NULL;
×
3587
  }
3588

3589
  if (state->pBrinBlock) {
×
3590
    tBrinBlockDestroy(state->pBrinBlock);
×
3591
    state->pBrinBlock = NULL;
×
3592
  }
3593

3594
  if (state->pIndexList) {
×
3595
    taosArrayDestroy(state->pIndexList);
×
3596
    state->pIndexList = NULL;
×
3597
  }
3598

3599
  if (state->pTSRow) {
×
3600
    taosMemoryFree(state->pTSRow);
×
3601
    state->pTSRow = NULL;
×
3602
  }
3603

3604
  if (state->pRowIter->pSkyline) {
×
3605
    taosArrayDestroy(state->pRowIter->pSkyline);
×
3606
    state->pRowIter->pSkyline = NULL;
×
3607
  }
3608

3609
  TAOS_RETURN(code);
×
3610
}
3611

3612
/*
 * Release the per-file-set resources of a file-system row iterator before it
 * moves to another file set: the stt iterator, block data, the reader's open
 * data file reader, the merged row buffer, and the delete skyline together
 * with the tomb data cached for every table in the reader's table map.
 *
 * A failure to close the stt iterator is logged only. Cleanup continues so
 * the open file reader is still closed; otherwise the next
 * tsdbDataFileReaderOpen in getNextRowFromFS would overwrite the pointer.
 */
static void clearLastFileSet(SFSNextRowIter *state) {
  if (state->pLastIter) {
    int code = lastIterClose(&state->pLastIter);
    if (code != TSDB_CODE_SUCCESS) {
      tsdbError("%s close last iter failed at line %d since %s", __func__, __LINE__, tstrerror(code));
      // keep going: the resources below are independent of the stt iterator
    }
  }

  if (state->pBlockData) {
    tBlockDataDestroy(state->pBlockData);
    state->pBlockData = NULL;
  }

  if (state->pr->pFileReader) {
    tsdbDataFileReaderClose(&state->pr->pFileReader);
    state->pr->pFileReader = NULL;

    state->pr->pCurFileSet = NULL;
  }

  if (state->pTSRow) {
    taosMemoryFree(state->pTSRow);
    state->pTSRow = NULL;
  }

  if (state->pRowIter->pSkyline) {
    taosArrayDestroy(state->pRowIter->pSkyline);
    state->pRowIter->pSkyline = NULL;

    // the skyline was built from the per-table tomb data, so drop that too
    void   *pe = NULL;
    int32_t iter = 0;
    while ((pe = tSimpleHashIterate(state->pr->pTableMap, pe, &iter)) != NULL) {
      STableLoadInfo *pInfo = *(STableLoadInfo **)pe;
      taosArrayDestroy(pInfo->pTombData);
      pInfo->pTombData = NULL;
    }
  }
}
3651

3652
static int32_t nextRowIterOpen(CacheNextRowIter *pIter, tb_uid_t uid, STsdb *pTsdb, STSchema *pTSchema, tb_uid_t suid,
×
3653
                               SArray *pLDataIterArray, STsdbReadSnap *pReadSnap, int64_t lastTs,
3654
                               SCacheRowsReader *pr) {
3655
  int32_t code = 0, lino = 0;
×
3656

3657
  STbData *pMem = NULL;
×
3658
  if (pReadSnap->pMem) {
×
3659
    pMem = tsdbGetTbDataFromMemTable(pReadSnap->pMem, suid, uid);
×
3660
  }
3661

3662
  STbData *pIMem = NULL;
×
3663
  if (pReadSnap->pIMem) {
×
3664
    pIMem = tsdbGetTbDataFromMemTable(pReadSnap->pIMem, suid, uid);
×
3665
  }
3666

3667
  pIter->pTsdb = pTsdb;
×
3668

3669
  pIter->pMemDelData = NULL;
×
3670

3671
  TAOS_CHECK_GOTO(loadMemTombData(&pIter->pMemDelData, pMem, pIMem, pr->info.verRange.maxVer), &lino, _err);
×
3672

3673
  pIter->idx = (SBlockIdx){.suid = suid, .uid = uid};
×
3674

3675
  pIter->fsState.pRowIter = pIter;
×
3676
  pIter->fsState.state = SFSNEXTROW_FS;
×
3677
  pIter->fsState.aDFileSet = pReadSnap->pfSetArray;
×
3678
  pIter->fsState.pBlockIdxExp = &pIter->idx;
×
3679
  pIter->fsState.pTSchema = pTSchema;
×
3680
  pIter->fsState.suid = suid;
×
3681
  pIter->fsState.uid = uid;
×
3682
  pIter->fsState.lastTs = lastTs;
×
3683
  pIter->fsState.pr = pr;
×
3684

3685
  pIter->input[0] = (TsdbNextRowState){&pIter->memRow, true, false, false, &pIter->memState, getNextRowFromMem, NULL};
×
3686
  pIter->input[1] = (TsdbNextRowState){&pIter->imemRow, true, false, false, &pIter->imemState, getNextRowFromMem, NULL};
×
3687
  pIter->input[2] =
×
3688
      (TsdbNextRowState){&pIter->fsRow, false, true, false, &pIter->fsState, getNextRowFromFS, clearNextRowFromFS};
×
3689

3690
  if (pMem) {
×
3691
    pIter->memState.pMem = pMem;
×
3692
    pIter->memState.state = SMEMNEXTROW_ENTER;
×
3693
    pIter->memState.lastTs = lastTs;
×
3694
    pIter->input[0].stop = false;
×
3695
    pIter->input[0].next = true;
×
3696
  }
3697

3698
  if (pIMem) {
×
3699
    pIter->imemState.pMem = pIMem;
×
3700
    pIter->imemState.state = SMEMNEXTROW_ENTER;
×
3701
    pIter->imemState.lastTs = lastTs;
×
3702
    pIter->input[1].stop = false;
×
3703
    pIter->input[1].next = true;
×
3704
  }
3705

3706
  pIter->pr = pr;
×
3707

3708
_err:
×
3709
  TAOS_RETURN(code);
×
3710
}
3711

3712
/*
 * Release an iterator opened by nextRowIterOpen: run the clear callback of
 * every input that has one (its result is ignored), then destroy the skyline
 * and the in-memory delete records if they are still present.
 */
static void nextRowIterClose(CacheNextRowIter *pIter) {
  TsdbNextRowState *pInput = pIter->input;
  TsdbNextRowState *pEnd = pInput + 3;

  for (; pInput != pEnd; ++pInput) {
    if (pInput->nextRowClearFn == NULL) {
      continue;
    }
    (void)pInput->nextRowClearFn(pInput->iter);
  }

  if (pIter->pSkyline != NULL) {
    taosArrayDestroy(pIter->pSkyline);
  }

  if (pIter->pMemDelData != NULL) {
    taosArrayDestroy(pIter->pMemDelData);
  }
}
×
3727

3728
// iterate next row non deleted backward ts, version (from high to low)
3729
static int32_t nextRowIterGet(CacheNextRowIter *pIter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast,
×
3730
                              int16_t *aCols, int nCols) {
3731
  int32_t code = 0, lino = 0;
×
3732

3733
  for (;;) {
×
3734
    for (int i = 0; i < 3; ++i) {
×
3735
      if (pIter->input[i].next && !pIter->input[i].stop) {
×
3736
        TAOS_CHECK_GOTO(pIter->input[i].nextRowFn(pIter->input[i].iter, &pIter->input[i].pRow,
×
3737
                                                  &pIter->input[i].ignoreEarlierTs, isLast, aCols, nCols),
3738
                        &lino, _err);
3739

3740
        if (pIter->input[i].pRow == NULL) {
×
3741
          pIter->input[i].stop = true;
×
3742
          pIter->input[i].next = false;
×
3743
        }
3744
      }
3745
    }
3746

3747
    if (pIter->input[0].stop && pIter->input[1].stop && pIter->input[2].stop) {
×
3748
      *ppRow = NULL;
×
3749
      *pIgnoreEarlierTs =
×
3750
          (pIter->input[0].ignoreEarlierTs || pIter->input[1].ignoreEarlierTs || pIter->input[2].ignoreEarlierTs);
×
3751

3752
      TAOS_RETURN(code);
×
3753
    }
3754

3755
    // select maxpoint(s) from mem, imem, fs and last
3756
    TSDBROW *max[4] = {0};
×
3757
    int      iMax[4] = {-1, -1, -1, -1};
×
3758
    int      nMax = 0;
×
3759
    SRowKey  maxKey = {.ts = TSKEY_MIN};
×
3760

3761
    for (int i = 0; i < 3; ++i) {
×
3762
      if (!pIter->input[i].stop && pIter->input[i].pRow != NULL) {
×
3763
        STsdbRowKey tsdbRowKey = {0};
×
3764
        tsdbRowGetKey(pIter->input[i].pRow, &tsdbRowKey);
×
3765

3766
        // merging & deduplicating on client side
3767
        int c = tRowKeyCompare(&maxKey, &tsdbRowKey.key);
×
3768
        if (c <= 0) {
×
3769
          if (c < 0) {
×
3770
            nMax = 0;
×
3771
            maxKey = tsdbRowKey.key;
×
3772
          }
3773

3774
          iMax[nMax] = i;
×
3775
          max[nMax++] = pIter->input[i].pRow;
×
3776
        }
3777
        pIter->input[i].next = false;
×
3778
      }
3779
    }
3780

3781
    // delete detection
3782
    TSDBROW *merge[4] = {0};
×
3783
    int      iMerge[4] = {-1, -1, -1, -1};
×
3784
    int      nMerge = 0;
×
3785
    for (int i = 0; i < nMax; ++i) {
×
3786
      TSDBKEY maxKey1 = TSDBROW_KEY(max[i]);
×
3787

3788
      if (!pIter->pSkyline) {
×
3789
        pIter->pSkyline = taosArrayInit(32, sizeof(TSDBKEY));
×
3790
        TSDB_CHECK_NULL(pIter->pSkyline, code, lino, _err, terrno);
×
3791

3792
        uint64_t        uid = pIter->idx.uid;
×
3793
        STableLoadInfo *pInfo = getTableLoadInfo(pIter->pr, uid);
×
3794
        TSDB_CHECK_NULL(pInfo, code, lino, _err, TSDB_CODE_OUT_OF_MEMORY);
×
3795

3796
        if (pInfo->pTombData == NULL) {
×
3797
          pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
×
3798
          TSDB_CHECK_NULL(pInfo->pTombData, code, lino, _err, terrno);
×
3799
        }
3800

3801
        if (!taosArrayAddAll(pInfo->pTombData, pIter->pMemDelData)) {
×
3802
          TAOS_CHECK_GOTO(terrno, &lino, _err);
×
3803
        }
3804

3805
        size_t delSize = TARRAY_SIZE(pInfo->pTombData);
×
3806
        if (delSize > 0) {
×
3807
          code = tsdbBuildDeleteSkyline(pInfo->pTombData, 0, (int32_t)(delSize - 1), pIter->pSkyline);
×
3808
          TAOS_CHECK_GOTO(code, &lino, _err);
×
3809
        }
3810
        pIter->iSkyline = taosArrayGetSize(pIter->pSkyline) - 1;
×
3811
      }
3812

3813
      bool deleted = tsdbKeyDeleted(&maxKey1, pIter->pSkyline, &pIter->iSkyline);
×
3814
      if (!deleted) {
×
3815
        iMerge[nMerge] = iMax[i];
×
3816
        merge[nMerge++] = max[i];
×
3817
      }
3818

3819
      pIter->input[iMax[i]].next = deleted;
×
3820
    }
3821

3822
    if (nMerge > 0) {
×
3823
      pIter->input[iMerge[0]].next = true;
×
3824

3825
      *ppRow = merge[0];
×
3826

3827
      TAOS_RETURN(code);
×
3828
    }
3829
  }
3830

3831
_err:
×
3832
  if (code) {
×
3833
    tsdbError("tsdb/cache: %s failed at line %d since %s.", __func__, lino, tstrerror(code));
×
3834
  }
3835

3836
  TAOS_RETURN(code);
×
3837
}
3838

3839
/*
 * Build an array of nCols SLastCol entries, one per slot id, each initialised
 * to a NULL column value carrying the column id and type found at that slot
 * of pTSchema.
 *
 * @param pTSchema   schema indexed by slotIds.
 * @param ppColArray receives the new array on success; untouched on failure.
 * @param slotIds    nCols indexes into pTSchema->columns.
 * @param nCols      number of entries to create.
 * @return TSDB_CODE_SUCCESS, or terrno when allocation or push fails. On
 *         failure the partially built array is destroyed.
 */
static int32_t initLastColArrayPartial(STSchema *pTSchema, SArray **ppColArray, int16_t *slotIds, int nCols) {
  SArray *pColArray = taosArrayInit(nCols, sizeof(SLastCol));
  if (NULL == pColArray) {
    TAOS_RETURN(terrno);
  }

  for (int32_t i = 0; i < nCols; ++i) {
    int16_t  slotId = slotIds[i];
    SLastCol col = {.rowKey.ts = 0,
                    .colVal = COL_VAL_NULL(pTSchema->columns[slotId].colId, pTSchema->columns[slotId].type)};
    if (!taosArrayPush(pColArray, &col)) {
      // capture the error before cleanup, then free the partial array instead of leaking it
      int32_t code = terrno;
      taosArrayDestroy(pColArray);
      TAOS_RETURN(code);
    }
  }
  *ppColArray = pColArray;

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
3857

3858
/*
 * Compute, for table uid, the most recent non-NULL value of each requested
 * column by walking rows backwards until every column has a value or the rows
 * run out.
 *
 * @param uid         table to read.
 * @param pTsdb       tsdb instance.
 * @param ppLastArray receives an SLastCol array parallel to slotIds. When no row
 *                    exists it is an empty array, or NULL if the iterator
 *                    reported ignoreEarlierTs. Set to NULL on error.
 * @param pr          reader providing schema, snapshot and suid.
 * @param aCols       nCols column ids to load.
 * @param nCols       number of requested columns.
 * @param slotIds     nCols schema slots matching aCols.
 * @return 0 on success, otherwise an error code.
 */
static int32_t mergeLastCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr, int16_t *aCols,
                            int nCols, int16_t *slotIds) {
  int32_t   code = 0, lino = 0;
  STSchema *pTSchema = pr->pSchema;  // metaGetTbTSchema(pTsdb->pVnode->pMeta, uid, -1, 1);
  int16_t   nLastCol = nCols;
  int16_t   noneCol = 0;         // first column index still lacking a value
  bool      setNoneCol = false;  // true when the current row left at least one column without a value
  bool      hasRow = false;
  bool      ignoreEarlierTs = false;
  SArray   *pColArray = NULL;
  SColVal  *pColVal = &(SColVal){0};

  TAOS_CHECK_RETURN(initLastColArrayPartial(pTSchema, &pColArray, slotIds, nCols));

  // column ids still to be loaded; entries are removed as values are found
  SArray *aColArray = taosArrayInit(nCols, sizeof(int16_t));
  if (NULL == aColArray) {
    code = terrno;
    taosArrayDestroy(pColArray);

    TAOS_RETURN(code);
  }

  for (int i = 0; i < nCols; ++i) {
    if (!taosArrayPush(aColArray, &aCols[i])) {
      code = terrno;
      taosArrayDestroy(aColArray);  // was leaked on this path
      taosArrayDestroy(pColArray);

      TAOS_RETURN(code);
    }
  }

  STsdbRowKey lastRowKey = {.key.ts = TSKEY_MAX};

  // inverse iterator
  CacheNextRowIter iter = {0};
  code =
      nextRowIterOpen(&iter, uid, pTsdb, pTSchema, pr->info.suid, pr->pLDataIterArray, pr->pReadSnap, pr->lastTs, pr);
  TAOS_CHECK_GOTO(code, &lino, _err);

  do {
    TSDBROW *pRow = NULL;
    // an iterator failure is an error, not "no more rows"
    TAOS_CHECK_GOTO(
        nextRowIterGet(&iter, &pRow, &ignoreEarlierTs, true, TARRAY_DATA(aColArray), TARRAY_SIZE(aColArray)), &lino,
        _err);

    if (!pRow) {
      break;
    }

    hasRow = true;

    int32_t sversion = TSDBROW_SVERSION(pRow);
    if (sversion != -1) {
      TAOS_CHECK_GOTO(updateTSchema(sversion, pr, uid), &lino, _err);

      pTSchema = pr->pCurrSchema;
    }
    // int16_t nCol = pTSchema->numOfCols;

    STsdbRowKey rowKey = {0};
    tsdbRowGetKey(pRow, &rowKey);

    if (lastRowKey.key.ts == TSKEY_MAX) {  // first time
      lastRowKey = rowKey;

      for (int16_t iCol = noneCol; iCol < nCols; ++iCol) {
        if (iCol >= nLastCol) {
          break;
        }
        SLastCol *pCol = taosArrayGet(pColArray, iCol);
        if (slotIds[iCol] > pTSchema->numOfCols - 1) {
          // slot does not exist in this row's schema version
          if (!setNoneCol) {
            noneCol = iCol;
            setNoneCol = true;
          }
          continue;
        }
        if (pCol->colVal.cid != pTSchema->columns[slotIds[iCol]].colId) {
          continue;
        }
        if (slotIds[iCol] == 0) {
          // timestamp column: synthesise the value from the row key
          STColumn *pTColumn = &pTSchema->columns[0];
          SValue    val = {.type = pTColumn->type};
          VALUE_SET_TRIVIAL_DATUM(&val, rowKey.key.ts);
          *pColVal = COL_VAL_VALUE(pTColumn->colId, val);

          SLastCol colTmp = {.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
          TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(&colTmp, NULL), &lino, _err);

          // store at this column's own position (was hard-coded to index 0)
          taosArraySet(pColArray, iCol, &colTmp);
          continue;
        }
        tsdbRowGetColVal(pRow, pTSchema, slotIds[iCol], pColVal);

        *pCol = (SLastCol){.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(pCol, NULL), &lino, _err);

        if (!COL_VAL_IS_VALUE(pColVal)) {
          if (!setNoneCol) {
            noneCol = iCol;
            setNoneCol = true;
          }
        } else {
          // value found: stop loading this column from earlier rows
          int32_t aColIndex = taosArraySearchIdx(aColArray, &pColVal->cid, compareInt16Val, TD_EQ);
          if (aColIndex >= 0) {
            taosArrayRemove(aColArray, aColIndex);
          }
        }
      }
      if (!setNoneCol) {
        // done, goto return pColArray
        break;
      } else {
        continue;
      }
    }

    // merge into pColArray
    setNoneCol = false;
    for (int16_t iCol = noneCol; iCol < nCols; ++iCol) {
      if (iCol >= nLastCol) {
        break;
      }
      // high version's column value
      if (slotIds[iCol] > pTSchema->numOfCols - 1) {
        continue;
      }

      SLastCol *lastColVal = (SLastCol *)taosArrayGet(pColArray, iCol);
      if (lastColVal->colVal.cid != pTSchema->columns[slotIds[iCol]].colId) {
        continue;
      }
      SColVal *tColVal = &lastColVal->colVal;
      if (COL_VAL_IS_VALUE(tColVal)) continue;

      tsdbRowGetColVal(pRow, pTSchema, slotIds[iCol], pColVal);
      if (COL_VAL_IS_VALUE(pColVal)) {
        SLastCol lastCol = {.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(&lastCol, NULL), &lino, _err);

        tsdbCacheFreeSLastColItem(lastColVal);
        taosArraySet(pColArray, iCol, &lastCol);
        int32_t aColIndex = taosArraySearchIdx(aColArray, &lastCol.colVal.cid, compareInt16Val, TD_EQ);
        if (aColIndex >= 0) {
          taosArrayRemove(aColArray, aColIndex);
        }
      } else if (!COL_VAL_IS_VALUE(pColVal) && !setNoneCol) {
        noneCol = iCol;
        setNoneCol = true;
      }
    }
  } while (setNoneCol);

  if (!hasRow) {
    if (ignoreEarlierTs) {
      taosArrayDestroy(pColArray);
      pColArray = NULL;
    } else {
      taosArrayClear(pColArray);
    }
  }
  *ppLastArray = pColArray;

  nextRowIterClose(&iter);
  taosArrayDestroy(aColArray);

  TAOS_RETURN(code);

_err:
  nextRowIterClose(&iter);
  // taosMemoryFreeClear(pTSchema);
  *ppLastArray = NULL;
  taosArrayDestroyEx(pColArray, tsdbCacheFreeSLastColItem);
  taosArrayDestroy(aColArray);

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
4036

4037
/*
 * Read the most recent row of table uid and copy the requested columns from
 * it. Only the first row returned by the backward iterator is used.
 *
 * @param uid         table to read.
 * @param pTsdb       tsdb instance.
 * @param ppLastArray receives an SLastCol array parallel to slotIds. When no row
 *                    exists it is an empty array, or NULL if the iterator
 *                    reported ignoreEarlierTs. Set to NULL on error.
 * @param pr          reader providing schema, snapshot and suid.
 * @param aCols       nCols column ids to load.
 * @param nCols       number of requested columns.
 * @param slotIds     nCols schema slots matching aCols.
 * @return 0 on success, otherwise an error code.
 */
static int32_t mergeLastRowCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr, int16_t *aCols,
                               int nCols, int16_t *slotIds) {
  int32_t   code = 0, lino = 0;
  STSchema *pTSchema = pr->pSchema;  // metaGetTbTSchema(pTsdb->pVnode->pMeta, uid, -1, 1);
  int16_t   nLastCol = nCols;
  bool      hasRow = false;
  bool      ignoreEarlierTs = false;
  SArray   *pColArray = NULL;
  SColVal  *pColVal = &(SColVal){0};

  TAOS_CHECK_RETURN(initLastColArrayPartial(pTSchema, &pColArray, slotIds, nCols));

  // column ids handed to the iterator
  SArray *aColArray = taosArrayInit(nCols, sizeof(int16_t));
  if (NULL == aColArray) {
    code = terrno;
    taosArrayDestroy(pColArray);

    TAOS_RETURN(code);
  }

  for (int i = 0; i < nCols; ++i) {
    if (!taosArrayPush(aColArray, &aCols[i])) {
      code = terrno;
      taosArrayDestroy(aColArray);  // was leaked on this path
      taosArrayDestroy(pColArray);

      TAOS_RETURN(code);
    }
  }

  // inverse iterator
  CacheNextRowIter iter = {0};
  code =
      nextRowIterOpen(&iter, uid, pTsdb, pTSchema, pr->info.suid, pr->pLDataIterArray, pr->pReadSnap, pr->lastTs, pr);
  TAOS_CHECK_GOTO(code, &lino, _err);

  TSDBROW *pRow = NULL;
  // an iterator failure is an error, not "no row"
  TAOS_CHECK_GOTO(
      nextRowIterGet(&iter, &pRow, &ignoreEarlierTs, false, TARRAY_DATA(aColArray), TARRAY_SIZE(aColArray)), &lino,
      _err);

  if (pRow != NULL) {
    hasRow = true;

    int32_t sversion = TSDBROW_SVERSION(pRow);
    if (sversion != -1) {
      TAOS_CHECK_GOTO(updateTSchema(sversion, pr, uid), &lino, _err);

      pTSchema = pr->pCurrSchema;
    }

    STsdbRowKey rowKey = {0};
    tsdbRowGetKey(pRow, &rowKey);

    for (int16_t iCol = 0; iCol < nLastCol; ++iCol) {
      SLastCol *pCol = taosArrayGet(pColArray, iCol);
      if (slotIds[iCol] > pTSchema->numOfCols - 1) {
        // slot does not exist in this row's schema version
        continue;
      }
      if (pCol->colVal.cid != pTSchema->columns[slotIds[iCol]].colId) {
        continue;
      }
      if (slotIds[iCol] == 0) {
        // timestamp column: synthesise the value from the row key
        STColumn *pTColumn = &pTSchema->columns[0];
        SValue    val = {.type = pTColumn->type};
        VALUE_SET_TRIVIAL_DATUM(&val, rowKey.key.ts);
        *pColVal = COL_VAL_VALUE(pTColumn->colId, val);

        SLastCol colTmp = {.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(&colTmp, NULL), &lino, _err);

        // store at this column's own position (was hard-coded to index 0)
        taosArraySet(pColArray, iCol, &colTmp);
        continue;
      }
      tsdbRowGetColVal(pRow, pTSchema, slotIds[iCol], pColVal);

      *pCol = (SLastCol){.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
      TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(pCol, NULL), &lino, _err);

      int32_t aColIndex = taosArraySearchIdx(aColArray, &pColVal->cid, compareInt16Val, TD_EQ);
      if (aColIndex >= 0) {
        taosArrayRemove(aColArray, aColIndex);
      }
    }
  }

  if (!hasRow) {
    if (ignoreEarlierTs) {
      taosArrayDestroy(pColArray);
      pColArray = NULL;
    } else {
      taosArrayClear(pColArray);
    }
  }
  *ppLastArray = pColArray;

  nextRowIterClose(&iter);
  taosArrayDestroy(aColArray);

  TAOS_RETURN(code);

_err:
  nextRowIterClose(&iter);

  *ppLastArray = NULL;
  taosArrayDestroyEx(pColArray, tsdbCacheFreeSLastColItem);
  taosArrayDestroy(aColArray);

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
4159

4160
/*
 * Release a handle obtained from `pCache`.
 *
 * Forwards to tsdbLRUCacheRelease() with eraseIfLastRef set to false.
 */
void tsdbCacheRelease(SLRUCache *pCache, LRUHandle *h) {
  const bool eraseIfLastRef = false;

  tsdbLRUCacheRelease(pCache, h, eraseIfLastRef);
}
×
4161

4162
/*
 * Set the capacity of the vnode's tsdb LRU cache.
 *
 * @param pVnode   vnode whose pTsdb->lruCache is resized
 * @param capacity new capacity, passed through to taosLRUCacheSetCapacity()
 *
 * Does nothing when pVnode->pTsdb is NULL, matching the guard used by
 * tsdbCacheGetUsage() and tsdbCacheGetElems() in this file.
 */
void tsdbCacheSetCapacity(SVnode *pVnode, size_t capacity) {
  if (pVnode->pTsdb == NULL) {
    return;
  }

  taosLRUCacheSetCapacity(pVnode->pTsdb->lruCache, capacity);
}
×
4165

4166
#ifdef BUILD_NO_CALL
4167
/* Return the capacity reported by taosLRUCacheGetCapacity() for the vnode's tsdb LRU cache. */
size_t tsdbCacheGetCapacity(SVnode *pVnode) {
  return taosLRUCacheGetCapacity(pVnode->pTsdb->lruCache);
}
4168
#endif
4169

4170
/*
 * Report the usage of the vnode's tsdb LRU cache.
 *
 * @return the value of taosLRUCacheGetUsage() for pVnode->pTsdb->lruCache,
 *         or 0 when the vnode has no tsdb attached (pTsdb == NULL).
 */
size_t tsdbCacheGetUsage(SVnode *pVnode) {
  if (pVnode->pTsdb == NULL) {
    return 0;
  }

  return taosLRUCacheGetUsage(pVnode->pTsdb->lruCache);
}
4178

4179
/*
 * Report the element count of the vnode's tsdb LRU cache.
 *
 * @return the value of taosLRUCacheGetElems() for pVnode->pTsdb->lruCache,
 *         or 0 when the vnode has no tsdb attached (pTsdb == NULL).
 */
int32_t tsdbCacheGetElems(SVnode *pVnode) {
  int32_t nElems = (pVnode->pTsdb != NULL) ? taosLRUCacheGetElems(pVnode->pTsdb->lruCache) : 0;

  return nElems;
}
4187

4188
#ifdef USE_SHARED_STORAGE
4189
// block cache
4190
/*
 * Build the binary cache key for a (fid, commitID, blkno) triple.
 *
 * The key is the raw object representation of a local struct holding the
 * three values, so it is only meaningful within this process.
 *
 * @param fid      file id
 * @param commitID commit id
 * @param blkno    block (or page) number
 * @param key      output buffer; must hold at least sizeof(the key struct) bytes
 * @param len      output; number of key bytes written
 */
static void getBCacheKey(int32_t fid, int64_t commitID, int64_t blkno, char *key, int *len) {
  struct {
    int32_t fid;
    int64_t commitID;
    int64_t blkno;
  } bKey;

  // The key is compared byte-wise, so padding bytes between members must be
  // deterministic. A `= {0}` initializer is not guaranteed to clear padding;
  // zero the whole object explicitly before filling in the members.
  memset(&bKey, 0, sizeof(bKey));

  bKey.fid = fid;
  bKey.commitID = commitID;
  bKey.blkno = blkno;

  *len = (int)sizeof(bKey);
  memcpy(key, &bKey, sizeof(bKey));
}
×
4204

4205
/*
 * Read block number pFD->blkno of the file described by pFD through
 * tssReadFileFromDefault() into a freshly allocated buffer.
 *
 * @param pFD     file descriptor; blkno is 1-based (offset uses blkno - 1)
 * @param ppBlock output; set to the allocated buffer on success only.
 *                The caller owns the buffer and frees it with taosMemoryFree().
 * @return 0 on success, TSDB_CODE_OUT_OF_MEMORY if allocation fails, or the
 *         error code returned by tssReadFileFromDefault().
 */
static int32_t tsdbCacheLoadBlockSs(STsdbFD *pFD, uint8_t **ppBlock) {
  int32_t code = 0;

  // Widen before multiplying so the product of block size (in pages) and page
  // size is computed in 64 bits, as tsdbOpenBCache() does.
  int64_t block_size = (int64_t)tsSsBlockSize * pFD->szPage;
  int64_t block_offset = (pFD->blkno - 1) * block_size;

  char *buf = taosMemoryMalloc(block_size);
  if (buf == NULL) {
    code = TSDB_CODE_OUT_OF_MEMORY;
    goto _exit;
  }

  // TODO: pFD->objName is not initialized, but this function is never called.
  code = tssReadFileFromDefault(pFD->objName, block_offset, buf, &block_size);
  if (code != TSDB_CODE_SUCCESS) {
    taosMemoryFree(buf);
    goto _exit;
  }
  *ppBlock = (uint8_t *)buf;

_exit:
  return code;
}
4228

4229
/*
 * LRU deleter used for block/page cache entries: frees the cached buffer.
 *
 * Only `value` is used; it is released with taosMemoryFree().
 */
static void deleteBCache(const void *key, size_t keyLen, void *value, void *ud) {
  (void)ud;

  taosMemoryFree((uint8_t *)value);
}
×
4235

4236
/*
 * Get a cache handle for block pFD->blkno of the file described by pFD,
 * loading the block via tsdbCacheLoadBlockSs() and inserting it into pCache
 * when it is not cached yet.
 *
 * @param pCache cache to look up / insert into
 * @param pFD    file descriptor supplying fid, cid, blkno, szPage and pTsdb
 * @param handle output; the cache handle, or NULL when loading failed
 * @return 0 on success; the load error code, or TSDB_CODE_OUT_OF_MEMORY when
 *         the load reported success but produced no block.
 */
int32_t tsdbCacheGetBlockSs(SLRUCache *pCache, STsdbFD *pFD, LRUHandle **handle) {
  int32_t code = 0;
  char    key[128] = {0};
  int     keyLen = 0;

  getBCacheKey(pFD->fid, pFD->cid, pFD->blkno, key, &keyLen);
  LRUHandle *h = taosLRUCacheLookup(pCache, key, keyLen);
  if (!h) {
    STsdb *pTsdb = pFD->pTsdb;
    (void)taosThreadMutexLock(&pTsdb->bMutex);

    // Look up again while holding bMutex so that an entry inserted between the
    // first lookup and taking the lock is reused instead of loaded twice.
    h = taosLRUCacheLookup(pCache, key, keyLen);
    if (!h) {
      uint8_t *pBlock = NULL;
      code = tsdbCacheLoadBlockSs(pFD, &pBlock);
      // On a load error, or when no block was produced, report failure with a NULL handle.
      if (code != TSDB_CODE_SUCCESS || pBlock == NULL) {
        (void)taosThreadMutexUnlock(&pTsdb->bMutex);

        *handle = NULL;
        if (code == TSDB_CODE_SUCCESS && !pBlock) {
          code = TSDB_CODE_OUT_OF_MEMORY;
        }

        TAOS_RETURN(code);
      }

      // Compute the charge in 64 bits before converting, so block size (in
      // pages) times page size is not evaluated in a narrower type.
      size_t              charge = (size_t)((int64_t)tsSsBlockSize * pFD->szPage);
      _taos_lru_deleter_t deleter = deleteBCache;
      LRUStatus           status =
          taosLRUCacheInsert(pCache, key, keyLen, pBlock, charge, deleter, NULL, &h, TAOS_LRU_PRIORITY_LOW, NULL);
      // NOTE(review): an insert status other than TAOS_LRU_STATUS_OK is deliberately
      // not turned into an error here; confirm callers cope with whatever `h` holds then.
      (void)status;
    }

    (void)taosThreadMutexUnlock(&pTsdb->bMutex);
  }

  *handle = h;

  TAOS_RETURN(code);
}
4279

4280
/*
 * Look up page `pgno` of the file described by pFD in pCache.
 *
 * @param handle output; result of taosLRUCacheLookup(). Left untouched when
 *               tsSsEnabled is false.
 * @return TSDB_CODE_OPS_NOT_SUPPORT when tsSsEnabled is false, otherwise 0.
 */
int32_t tsdbCacheGetPageSs(SLRUCache *pCache, STsdbFD *pFD, int64_t pgno, LRUHandle **handle) {
  if (tsSsEnabled) {
    char pageKey[128] = {0};
    int  pageKeyLen = 0;

    getBCacheKey(pFD->fid, pFD->cid, pgno, pageKey, &pageKeyLen);
    *handle = taosLRUCacheLookup(pCache, pageKey, pageKeyLen);

    return 0;
  }

  return TSDB_CODE_OPS_NOT_SUPPORT;
}
4294

4295
/*
 * Cache a copy of page `pgno` of the file described by pFD.
 *
 * Does nothing when tsSsEnabled is false. Under pgMutex, the page is looked up
 * in pFD->pTsdb->pgCache; if absent, pFD->szPage bytes of pPage are copied into
 * a new buffer and inserted into pCache with deleteBCache as the deleter. The
 * handle obtained is then released. Allocation and insert failures are ignored.
 *
 * NOTE(review): lookup and release use pFD->pTsdb->pgCache while the insert
 * uses pCache; presumably callers pass the same cache for both - confirm.
 */
void tsdbCacheSetPageSs(SLRUCache *pCache, STsdbFD *pFD, int64_t pgno, uint8_t *pPage) {
  if (!tsSsEnabled) {
    return;
  }

  char       pageKey[128] = {0};
  int        pageKeyLen = 0;
  LRUHandle *h = NULL;

  getBCacheKey(pFD->fid, pFD->cid, pgno, pageKey, &pageKeyLen);

  (void)taosThreadMutexLock(&pFD->pTsdb->pgMutex);

  h = taosLRUCacheLookup(pFD->pTsdb->pgCache, pageKey, pageKeyLen);
  if (h == NULL) {
    size_t   pageSize = pFD->szPage;
    uint8_t *pCopy = taosMemoryMalloc(pageSize);
    if (pCopy == NULL) {
      // ignore error with ss cache and leave error untouched
      (void)taosThreadMutexUnlock(&pFD->pTsdb->pgMutex);
      return;
    }
    memcpy(pCopy, pPage, pageSize);

    // A status other than TAOS_LRU_STATUS_OK is ignored: the cache is simply not updated.
    LRUStatus insertStatus = taosLRUCacheInsert(pCache, pageKey, pageKeyLen, pCopy, pageSize, deleteBCache, NULL, &h,
                                                TAOS_LRU_PRIORITY_LOW, NULL);
    (void)insertStatus;
  }

  (void)taosThreadMutexUnlock(&pFD->pTsdb->pgMutex);

  tsdbCacheRelease(pFD->pTsdb->pgCache, h);
}
4329
#endif
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc