• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #3599

08 Feb 2025 11:23AM UTC coverage: 1.77% (-61.6%) from 63.396%
#3599

push

travis-ci

web-flow
Merge pull request #29712 from taosdata/fix/TD-33652-3.0

fix: reduce write rows from 30w to 3w

3776 of 278949 branches covered (1.35%)

Branch coverage included in aggregate %.

6012 of 274147 relevant lines covered (2.19%)

1642.73 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

0.0
/source/dnode/vnode/src/tsdb/tsdbCache.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15
#include "functionMgt.h"
16
#include "tcs.h"
17
#include "tsdb.h"
18
#include "tsdbDataFileRW.h"
19
#include "tsdbIter.h"
20
#include "tsdbReadUtil.h"
21
#include "vnd.h"
22

23
#define ROCKS_BATCH_SIZE (4096)
24

25
/*
 * Release `handle` back to `cache` via taosLRUCacheRelease(), forwarding
 * `eraseIfLastRef` unchanged. A trace message is emitted when that call
 * reports failure (returns false); nothing is returned to the caller.
 */
void tsdbLRUCacheRelease(SLRUCache *cache, LRUHandle *handle, bool eraseIfLastRef) {
  bool released = taosLRUCacheRelease(cache, handle, eraseIfLastRef);
  if (released) {
    return;
  }

  tsdbTrace(" release lru cache failed");
}
×
30

31
/*
 * Create the LRU cache stored in pTsdb->bCache and initialise pTsdb->bMutex.
 *
 * The capacity is tsS3BlockCacheSize * max(tsS3BlockSize, 1024) * tsdbPageSize,
 * evaluated in 64-bit arithmetic. Strict capacity is switched off.
 *
 * Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY when the cache cannot be created.
 */
static int32_t tsdbOpenBCache(STsdb *pTsdb) {
  int32_t code = 0;
  int32_t lino = 0;

  int32_t pageSize = pTsdb->pVnode->config.tsdbPageSize;
  int64_t blockSize = tsS3BlockSize;
  if (blockSize <= 1024) {
    // never size the cache with fewer than 1024 per block
    blockSize = 1024;
  }

  SLRUCache *pLru = taosLRUCacheInit((int64_t)tsS3BlockCacheSize * blockSize * pageSize, 0, .5);
  if (NULL == pLru) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  taosLRUCacheSetStrictCapacity(pLru, false);
  (void)taosThreadMutexInit(&pTsdb->bMutex, NULL);
  pTsdb->bCache = pLru;

_err:
  if (code != 0) {
    tsdbError("tsdb/bcache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
54

55
/*
 * Tear down the cache created by tsdbOpenBCache(): erase unreferenced entries,
 * clean up the LRU cache and destroy pTsdb->bMutex. The element count is traced
 * before and after the erase. Does nothing when pTsdb->bCache is NULL.
 */
static void tsdbCloseBCache(STsdb *pTsdb) {
  SLRUCache *pLru = pTsdb->bCache;
  if (NULL == pLru) {
    return;
  }

  int32_t nElems = taosLRUCacheGetElems(pLru);
  tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), nElems);

  taosLRUCacheEraseUnrefEntries(pLru);

  nElems = taosLRUCacheGetElems(pLru);
  tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), nElems);

  taosLRUCacheCleanup(pLru);
  (void)taosThreadMutexDestroy(&pTsdb->bMutex);
}
×
69

70
/*
 * Create the LRU cache stored in pTsdb->pgCache and initialise pTsdb->pgMutex.
 *
 * The capacity is tsS3PageCacheSize * tsdbPageSize, evaluated in 64-bit
 * arithmetic. Strict capacity is switched off.
 *
 * Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY when the cache cannot be created.
 */
static int32_t tsdbOpenPgCache(STsdb *pTsdb) {
  int32_t code = 0;
  int32_t lino = 0;

  int32_t    pageSize = pTsdb->pVnode->config.tsdbPageSize;
  SLRUCache *pLru = taosLRUCacheInit((int64_t)tsS3PageCacheSize * pageSize, 0, .5);
  if (NULL == pLru) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  taosLRUCacheSetStrictCapacity(pLru, false);
  (void)taosThreadMutexInit(&pTsdb->pgMutex, NULL);
  pTsdb->pgCache = pLru;

_err:
  if (code != 0) {
    tsdbError("tsdb/pgcache: vgId:%d, open failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));
  }

  TAOS_RETURN(code);
}
92

93
/*
 * Tear down the cache created by tsdbOpenPgCache(): erase unreferenced entries,
 * clean up the LRU cache and destroy the mutex that belongs to it. The element
 * count is traced before and after the erase. Does nothing when pTsdb->pgCache
 * is NULL.
 */
static void tsdbClosePgCache(STsdb *pTsdb) {
  SLRUCache *pCache = pTsdb->pgCache;
  if (pCache) {
    int32_t elems = taosLRUCacheGetElems(pCache);
    tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), elems);
    taosLRUCacheEraseUnrefEntries(pCache);
    elems = taosLRUCacheGetElems(pCache);
    tsdbTrace("vgId:%d, elems: %d", TD_VID(pTsdb->pVnode), elems);

    taosLRUCacheCleanup(pCache);

    // tsdbOpenPgCache() initialises pgMutex; bMutex belongs to the block cache
    // and is destroyed by tsdbCloseBCache().
    (void)taosThreadMutexDestroy(&pTsdb->pgMutex);
  }
}
×
107

108
#define ROCKS_KEY_LEN (sizeof(tb_uid_t) + sizeof(int16_t) + sizeof(int8_t))
109

110
// Values stored in SLastKey.lflag; only the lowest bit is examined by
// IS_LAST_ROW_KEY()/IS_LAST_KEY() and by the rocksdb comparator.
enum {
  LFLAG_LAST_ROW = 0,  // key addresses a "last_row" cache entry
  LFLAG_LAST = 1,      // key addresses a "last" cache entry
};
114

115
typedef struct {
116
  tb_uid_t uid;
117
  int16_t  cid;
118
  int8_t   lflag;
119
} SLastKey;
120

121
#define IS_LAST_ROW_KEY(k) (((k).lflag & LFLAG_LAST) == LFLAG_LAST_ROW)
122
#define IS_LAST_KEY(k)     (((k).lflag & LFLAG_LAST) == LFLAG_LAST)
123

124
/*
 * Build the rocksdb cache directory path for this tsdb into `path`.
 *
 * The primary directory is written by vnodeGetPrimaryDir() with a limit of
 * TSDB_FILENAME_LEN, then "<TD_DIRSEP>cache.rdb" is appended. `path` is
 * therefore expected to hold at least TSDB_FILENAME_LEN bytes.
 */
static void tsdbGetRocksPath(STsdb *pTsdb, char *path) {
  SVnode *pVnode = pTsdb->pVnode;

  vnodeGetPrimaryDir(pTsdb->path, pVnode->diskPrimary, pVnode->pTfs, path, TSDB_FILENAME_LEN);

  int32_t dirLen = strlen(path);
  char   *pTail = path + dirLen;
  snprintf(pTail, TSDB_FILENAME_LEN - dirLen - 1, "%scache.rdb", TD_DIRSEP);
}
×
131

132
// Comparator name callback handed to rocksdb_comparator_create(); `state` is unused.
static const char *myCmpName(void *state) {
  (void)state;

  const char *name = "myCmp";
  return name;
}
136

137
// Comparator destructor callback handed to rocksdb_comparator_create().
static void myCmpDestroy(void *state) {
  (void)state;  // the comparator carries no state, so there is nothing to release
}
×
138

139
static int myCmp(void *state, const char *a, size_t alen, const char *b, size_t blen) {
×
140
  (void)state;
141
  (void)alen;
142
  (void)blen;
143
  SLastKey *lhs = (SLastKey *)a;
×
144
  SLastKey *rhs = (SLastKey *)b;
×
145

146
  if (lhs->uid < rhs->uid) {
×
147
    return -1;
×
148
  } else if (lhs->uid > rhs->uid) {
×
149
    return 1;
×
150
  }
151

152
  if (lhs->cid < rhs->cid) {
×
153
    return -1;
×
154
  } else if (lhs->cid > rhs->cid) {
×
155
    return 1;
×
156
  }
157

158
  if ((lhs->lflag & LFLAG_LAST) < (rhs->lflag & LFLAG_LAST)) {
×
159
    return -1;
×
160
  } else if ((lhs->lflag & LFLAG_LAST) > (rhs->lflag & LFLAG_LAST)) {
×
161
    return 1;
×
162
  }
163

164
  return 0;
×
165
}
166

167
/*
 * Open (creating if missing) the rocksdb instance that backs the last/last_row
 * cache and populate pTsdb->rCache.
 *
 * Every rocksdb object is created into a local first; pTsdb->rCache is only
 * written once everything has succeeded, so a failed open leaves no pointers
 * to already-destroyed objects behind. On failure the objects created so far
 * are released in reverse order of creation.
 *
 * Returns 0 on success, TSDB_CODE_OUT_OF_MEMORY when a rocksdb object cannot be
 * created or the database cannot be opened, otherwise the error reported by
 * taosThreadMutexInit() or terrno from taosArrayInit().
 */
static int32_t tsdbOpenRocksCache(STsdb *pTsdb) {
  int32_t code = 0, lino = 0;

  rocksdb_comparator_t *cmp = rocksdb_comparator_create(NULL, myCmpDestroy, myCmp, myCmpName);
  if (NULL == cmp) {
    TAOS_RETURN(TSDB_CODE_OUT_OF_MEMORY);
  }

  rocksdb_block_based_table_options_t *tableoptions = rocksdb_block_based_options_create();
  if (NULL == tableoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  rocksdb_options_t *options = rocksdb_options_create();
  if (NULL == options) {
    // tableoptions already exists here and must be released too
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err1);
  }

  rocksdb_options_set_create_if_missing(options, 1);
  rocksdb_options_set_comparator(options, cmp);
  rocksdb_options_set_block_based_table_factory(options, tableoptions);
  rocksdb_options_set_info_log_level(options, 2);  // WARN_LEVEL

  rocksdb_writeoptions_t *writeoptions = rocksdb_writeoptions_create();
  if (NULL == writeoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err2);
  }
  rocksdb_writeoptions_disable_WAL(writeoptions, 1);

  rocksdb_readoptions_t *readoptions = rocksdb_readoptions_create();
  if (NULL == readoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err3);
  }

  char *err = NULL;
  char  cachePath[TSDB_FILENAME_LEN] = {0};
  tsdbGetRocksPath(pTsdb, cachePath);

  rocksdb_t *db = rocksdb_open(options, cachePath, &err);
  if (NULL == db) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, err);
    rocksdb_free(err);

    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err4);
  }

  rocksdb_flushoptions_t *flushoptions = rocksdb_flushoptions_create();
  if (NULL == flushoptions) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err5);
  }

  rocksdb_writebatch_t *writebatch = rocksdb_writebatch_create();
  if (NULL == writebatch) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err6);
  }

  TAOS_CHECK_GOTO(taosThreadMutexInit(&pTsdb->rCache.writeBatchMutex, NULL), &lino, _err7);

  SArray *ctxArray = taosArrayInit(16, sizeof(SLastUpdateCtx));
  if (!ctxArray) {
    TAOS_CHECK_GOTO(terrno, &lino, _err8);
  }

  // everything succeeded: publish the handles
  pTsdb->rCache.tableoptions = tableoptions;
  pTsdb->rCache.writebatch = writebatch;
  pTsdb->rCache.my_comparator = cmp;
  pTsdb->rCache.options = options;
  pTsdb->rCache.writeoptions = writeoptions;
  pTsdb->rCache.readoptions = readoptions;
  pTsdb->rCache.flushoptions = flushoptions;
  pTsdb->rCache.db = db;
  pTsdb->rCache.sver = -1;
  pTsdb->rCache.suid = -1;
  pTsdb->rCache.uid = -1;
  pTsdb->rCache.pTSchema = NULL;
  pTsdb->rCache.ctxArray = ctxArray;

  TAOS_RETURN(code);

_err8:
  (void)taosThreadMutexDestroy(&pTsdb->rCache.writeBatchMutex);
_err7:
  rocksdb_writebatch_destroy(writebatch);
_err6:
  rocksdb_flushoptions_destroy(flushoptions);
_err5:
  // close the local handle: pTsdb->rCache.db has not been assigned on this path
  rocksdb_close(db);
_err4:
  rocksdb_readoptions_destroy(readoptions);
_err3:
  rocksdb_writeoptions_destroy(writeoptions);
_err2:
  rocksdb_options_destroy(options);
_err1:
  rocksdb_block_based_options_destroy(tableoptions);
_err:
  rocksdb_comparator_destroy(cmp);

  TAOS_RETURN(code);
}
258

259
/*
 * Release everything held in pTsdb->rCache: the database is closed first, then
 * the write-batch mutex, the rocksdb option/batch/comparator objects, the
 * cached schema and the update-context array are destroyed.
 */
static void tsdbCloseRocksCache(STsdb *pTsdb) {
  SRocksCache *pRCache = &pTsdb->rCache;

  rocksdb_close(pRCache->db);
  (void)taosThreadMutexDestroy(&pRCache->writeBatchMutex);

  rocksdb_flushoptions_destroy(pRCache->flushoptions);
  rocksdb_writebatch_destroy(pRCache->writebatch);
  rocksdb_readoptions_destroy(pRCache->readoptions);
  rocksdb_writeoptions_destroy(pRCache->writeoptions);
  rocksdb_options_destroy(pRCache->options);
  rocksdb_block_based_options_destroy(pRCache->tableoptions);
  rocksdb_comparator_destroy(pRCache->my_comparator);

  taosMemoryFree(pRCache->pTSchema);
  taosArrayDestroy(pRCache->ctxArray);
}
×
272

273
/*
 * Write the pending rocksdb write batch when it holds at least ROCKS_BATCH_SIZE
 * operations, or when `force` is set and it is not empty.
 *
 * A write error is logged and otherwise ignored; the batch is cleared after the
 * write attempt in either case.
 */
static void rocksMayWrite(STsdb *pTsdb, bool force) {
  rocksdb_writebatch_t *pBatch = pTsdb->rCache.writebatch;
  int                   nPending = rocksdb_writebatch_count(pBatch);

  bool forced = force && nPending > 0;
  if (!forced && nPending < ROCKS_BATCH_SIZE) {
    return;
  }

  char *errMsg = NULL;
  rocksdb_write(pTsdb->rCache.db, pTsdb->rCache.writeoptions, pBatch, &errMsg);
  if (errMsg != NULL) {
    tsdbError("vgId:%d, %s failed at line %d, count: %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, nPending,
              errMsg);
    rocksdb_free(errMsg);
  }

  rocksdb_writebatch_clear(pBatch);
}
×
290

291
typedef struct {
292
  TSKEY  ts;
293
  int8_t dirty;
294
  struct {
295
    int16_t cid;
296
    int8_t  type;
297
    int8_t  flag;
298
    union {
299
      int64_t val;
300
      struct {
301
        uint32_t nData;
302
        uint8_t *pData;
303
      };
304
    } value;
305
  } colVal;
306
} SLastColV0;
307

308
/*
 * Decode the version-0 part of a serialized value into `pLastCol`.
 *
 * `value` is read as an SLastColV0 header; no length is passed in, so the
 * caller is responsible for `value` being large enough. For variable-length
 * column types, colVal.value.pData is pointed at the bytes that follow the
 * header inside `value` (or set to NULL when nData is 0); nothing is copied.
 * rowKey.numOfPKs is set to 0 and cacheStatus to TSDB_LAST_CACHE_VALID.
 *
 * Returns the number of bytes consumed: the header size, plus nData for
 * variable-length types.
 */
static int32_t tsdbCacheDeserializeV0(char const *value, SLastCol *pLastCol) {
  SLastColV0 *pDisk = (SLastColV0 *)value;

  pLastCol->rowKey.ts = pDisk->ts;
  pLastCol->rowKey.numOfPKs = 0;
  pLastCol->dirty = pDisk->dirty;
  pLastCol->colVal.cid = pDisk->colVal.cid;
  pLastCol->colVal.flag = pDisk->colVal.flag;
  pLastCol->colVal.value.type = pDisk->colVal.type;
  pLastCol->cacheStatus = TSDB_LAST_CACHE_VALID;

  if (!IS_VAR_DATA_TYPE(pLastCol->colVal.value.type)) {
    pLastCol->colVal.value.val = pDisk->colVal.value.val;
    return sizeof(SLastColV0);
  }

  uint32_t nData = pDisk->colVal.value.nData;
  pLastCol->colVal.value.nData = nData;
  // the payload, when present, starts right behind the header
  pLastCol->colVal.value.pData = (nData > 0) ? (uint8_t *)(&pDisk[1]) : NULL;

  return sizeof(SLastColV0) + nData;
}
332

333
/*
 * Decode a serialized last/last_row value of `size` bytes into a newly
 * allocated SLastCol.
 *
 * Layout: SLastColV0 header [+ column bytes]; optionally followed by
 * version (1 byte), numOfPKs (1 byte), numOfPKs * (SValue [+ pk bytes]) and,
 * for version >= LAST_COL_VERSION_2, cacheStatus (1 byte). A buffer that ends
 * right after the V0 part is accepted as version 0.
 *
 * Every read is bounds-checked against `size` before it happens, so truncated
 * or corrupted input yields TSDB_CODE_INVALID_DATA_FMT.
 *
 * On success *ppLastCol owns the SLastCol struct, but the pData pointers of
 * variable-length values point INTO `value`; nothing is copied here.
 *
 * Returns TSDB_CODE_SUCCESS, TSDB_CODE_INVALID_PARA when `value` is NULL,
 * terrno when allocation fails, or TSDB_CODE_INVALID_DATA_FMT.
 */
static int32_t tsdbCacheDeserialize(char const *value, size_t size, SLastCol **ppLastCol) {
  if (!value) {
    return TSDB_CODE_INVALID_PARA;
  }

  // tsdbCacheDeserializeV0() reads the fixed header unconditionally
  if (size < sizeof(SLastColV0)) {
    TAOS_RETURN(TSDB_CODE_INVALID_DATA_FMT);
  }

  SLastCol *pLastCol = taosMemoryCalloc(1, sizeof(SLastCol));
  if (NULL == pLastCol) {
    return terrno;
  }

  int32_t v0Len = tsdbCacheDeserializeV0(value, pLastCol);
  if (v0Len < 0 || (size_t)v0Len > size) {
    goto _invalid;
  }

  size_t offset = (size_t)v0Len;
  if (offset == size) {
    // version 0
    *ppLastCol = pLastCol;

    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  // version + numOfPKs
  if (size - offset < sizeof(int8_t) + sizeof(uint8_t)) {
    goto _invalid;
  }
  int8_t version = *(int8_t *)(value + offset);
  offset += sizeof(int8_t);

  uint8_t numOfPKs = *(uint8_t *)(value + offset);
  offset += sizeof(uint8_t);

  // assumes rowKey.pks is a fixed-size array member, as its indexed use implies
  if (numOfPKs > sizeof(pLastCol->rowKey.pks) / sizeof(pLastCol->rowKey.pks[0])) {
    goto _invalid;
  }
  pLastCol->rowKey.numOfPKs = numOfPKs;

  // pks
  for (int32_t i = 0; i < numOfPKs; i++) {
    SValue *pPk = &pLastCol->rowKey.pks[i];

    if (size - offset < sizeof(SValue)) {
      goto _invalid;
    }
    // memcpy: the encoded SValue is not guaranteed to be suitably aligned
    (void)memcpy(pPk, value + offset, sizeof(SValue));
    offset += sizeof(SValue);

    if (IS_VAR_DATA_TYPE(pPk->type)) {
      pPk->pData = NULL;
      if (pPk->nData > 0) {
        if (size - offset < pPk->nData) {
          goto _invalid;
        }
        pPk->pData = (uint8_t *)value + offset;
        offset += pPk->nData;
      }
    }
  }

  if (version >= LAST_COL_VERSION_2) {
    if (offset >= size) {
      goto _invalid;
    }
    pLastCol->cacheStatus = *(uint8_t *)(value + offset);
  }

  *ppLastCol = pLastCol;

  TAOS_RETURN(TSDB_CODE_SUCCESS);

_invalid:
  taosMemoryFreeClear(pLastCol);

  TAOS_RETURN(TSDB_CODE_INVALID_DATA_FMT);
}
391

392
/*
393
typedef struct {
394
  SLastColV0 lastColV0;
395
  char       colData[];
396
  int8_t     version;
397
  uint8_t    numOfPKs;
398
  SValue     pks[0];
399
  char       pk0Data[];
400
  SValue     pks[1];
401
  char       pk1Data[];
402
  ...
  uint8_t    cacheStatus;  // last byte, written by tsdbCacheSerialize after the pks
403
} SLastColDisk;
404
*/
405
/*
 * Encode the version-0 part of `pLastCol` into the buffer at `value`.
 *
 * Writes an SLastColV0 header and, for variable-length column types, copies the
 * nData column bytes right behind it. The buffer is written through despite the
 * const-qualified parameter, and must be large enough for the returned length.
 *
 * Returns the number of bytes written.
 */
static int32_t tsdbCacheSerializeV0(char const *value, SLastCol *pLastCol) {
  SLastColV0 *pDisk = (SLastColV0 *)value;

  pDisk->ts = pLastCol->rowKey.ts;
  pDisk->dirty = pLastCol->dirty;
  pDisk->colVal.cid = pLastCol->colVal.cid;
  pDisk->colVal.flag = pLastCol->colVal.flag;
  pDisk->colVal.type = pLastCol->colVal.value.type;

  if (!IS_VAR_DATA_TYPE(pLastCol->colVal.value.type)) {
    pDisk->colVal.value.val = pLastCol->colVal.value.val;
    return sizeof(SLastColV0);
  }

  pDisk->colVal.value.nData = pLastCol->colVal.value.nData;
  if (pLastCol->colVal.value.nData > 0) {
    memcpy(&pDisk[1], pLastCol->colVal.value.pData, pLastCol->colVal.value.nData);
  }

  return sizeof(SLastColV0) + pLastCol->colVal.value.nData;
}
426

427
/*
 * Serialize `pLastCol` into a newly allocated buffer.
 *
 * Layout: V0 part (tsdbCacheSerializeV0), version byte (LAST_COL_VERSION),
 * numOfPKs byte, then for each primary key the SValue followed by its bytes
 * when the type is variable-length, and finally the cacheStatus byte.
 *
 * *size receives the encoded length and *value the buffer, which the caller
 * must free. Returns TSDB_CODE_SUCCESS, or terrno when allocation fails (in
 * which case *value is NULL).
 */
static int32_t tsdbCacheSerialize(SLastCol *pLastCol, char **value, size_t *size) {
  // first pass: work out the encoded length
  *size = sizeof(SLastColV0);
  if (IS_VAR_DATA_TYPE(pLastCol->colVal.value.type)) {
    *size += pLastCol->colVal.value.nData;
  }
  *size += sizeof(uint8_t) + sizeof(uint8_t) + sizeof(uint8_t);  // version + numOfPKs + cacheStatus

  for (int8_t iPk = 0; iPk < pLastCol->rowKey.numOfPKs; iPk++) {
    *size += sizeof(SValue);
    if (IS_VAR_DATA_TYPE(pLastCol->rowKey.pks[iPk].type)) {
      *size += pLastCol->rowKey.pks[iPk].nData;
    }
  }

  *value = taosMemoryMalloc(*size);
  if (NULL == *value) {
    TAOS_RETURN(terrno);
  }

  // second pass: emit the fields, advancing a write cursor
  char *pCursor = *value + tsdbCacheSerializeV0(*value, pLastCol);

  // version
  ((uint8_t *)pCursor)[0] = LAST_COL_VERSION;
  pCursor++;

  // numOfPKs
  ((uint8_t *)pCursor)[0] = pLastCol->rowKey.numOfPKs;
  pCursor++;

  // pks
  for (int8_t iPk = 0; iPk < pLastCol->rowKey.numOfPKs; iPk++) {
    ((SValue *)pCursor)[0] = pLastCol->rowKey.pks[iPk];
    pCursor += sizeof(SValue);

    if (!IS_VAR_DATA_TYPE(pLastCol->rowKey.pks[iPk].type)) {
      continue;
    }
    if (pLastCol->rowKey.pks[iPk].nData > 0) {
      memcpy(pCursor, pLastCol->rowKey.pks[iPk].pData, pLastCol->rowKey.pks[iPk].nData);
    }
    pCursor += pLastCol->rowKey.pks[iPk].nData;
  }

  // cacheStatus
  ((uint8_t *)pCursor)[0] = pLastCol->cacheStatus;

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
472

473
static int32_t tsdbCachePutToRocksdb(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol);
474

475
int tsdbCacheFlushDirty(const void *key, size_t klen, void *value, void *ud) {
×
476
  SLastCol *pLastCol = (SLastCol *)value;
×
477

478
  if (pLastCol->dirty) {
×
479
    STsdb *pTsdb = (STsdb *)ud;
×
480

481
    int32_t code = tsdbCachePutToRocksdb(pTsdb, (SLastKey *)key, pLastCol);
×
482
    if (code) {
×
483
      tsdbError("tsdb/cache: vgId:%d, flush dirty lru failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
×
484
      return code;
×
485
    }
486

487
    pLastCol->dirty = 0;
×
488

489
    rocksMayWrite(pTsdb, false);
×
490
  }
491

492
  return 0;
×
493
}
494

495
/*
 * Decide whether `key` is covered by the delete skyline.
 *
 * *iSkyline is a cursor into `pSkyline` that is examined together with its
 * predecessor and only ever moves towards index 1. With a cursor of 0 (or
 * less) the skyline is not consulted and false is returned.
 *
 * For the segment [front, back] = [*iSkyline - 1, *iSkyline]:
 *   - key->ts beyond back->ts            -> not deleted
 *   - key->ts inside the segment and its version not newer than front's, or
 *     key->ts == back->ts and its version not newer than back's -> deleted
 *   - otherwise step the cursor down, or report not deleted at cursor 1
 */
static bool tsdbKeyDeleted(TSDBKEY *key, SArray *pSkyline, int64_t *iSkyline) {
  while (*iSkyline > 0) {
    TSDBKEY *pBack = (TSDBKEY *)taosArrayGet(pSkyline, *iSkyline);
    TSDBKEY *pFront = (TSDBKEY *)taosArrayGet(pSkyline, *iSkyline - 1);

    if (key->ts > pBack->ts) {
      return false;
    }

    // from here on key->ts <= pBack->ts holds
    if (key->ts >= pFront->ts) {
      bool coveredByFront = key->version <= pFront->version;
      bool coveredByBack = (key->ts == pBack->ts) && (key->version <= pBack->version);
      if (coveredByFront || coveredByBack) {
        return true;
      }
    }

    if (*iSkyline <= 1) {
      return false;
    }
    --*iSkyline;
  }

  return false;
}
525

526
// Get next non-deleted row from imem
527
static TSDBROW *tsdbImemGetNextRow(STbDataIter *pTbIter, SArray *pSkyline, int64_t *piSkyline) {
×
528
  int32_t code = 0;
×
529

530
  if (tsdbTbDataIterNext(pTbIter)) {
×
531
    TSDBROW *pMemRow = tsdbTbDataIterGet(pTbIter);
×
532
    TSDBKEY  rowKey = TSDBROW_KEY(pMemRow);
×
533
    bool     deleted = tsdbKeyDeleted(&rowKey, pSkyline, piSkyline);
×
534
    if (!deleted) {
×
535
      return pMemRow;
×
536
    }
537
  }
538

539
  return NULL;
×
540
}
541

542
// Get first non-deleted row from imem
543
static TSDBROW *tsdbImemGetFirstRow(SMemTable *imem, STbData *pIMem, STbDataIter *pTbIter, SArray *pSkyline,
×
544
                                    int64_t *piSkyline) {
545
  int32_t code = 0;
×
546

547
  tsdbTbDataIterOpen(pIMem, NULL, 1, pTbIter);
×
548
  TSDBROW *pMemRow = tsdbTbDataIterGet(pTbIter);
×
549
  if (pMemRow) {
×
550
    // if non deleted, return the found row.
551
    TSDBKEY rowKey = TSDBROW_KEY(pMemRow);
×
552
    bool    deleted = tsdbKeyDeleted(&rowKey, pSkyline, piSkyline);
×
553
    if (!deleted) {
×
554
      return pMemRow;
×
555
    }
556
  } else {
557
    return NULL;
×
558
  }
559

560
  // continue to find the non-deleted first row from imem, using get next row
561
  return tsdbImemGetNextRow(pTbIter, pSkyline, piSkyline);
×
562
}
563

564
/*
 * Invalidate the schema remembered in pTsdb->rCache when a newer schema
 * version `sver` arrives for the table it was loaded for.
 *
 * Nothing happens when no schema is cached or `sver` is not greater than the
 * cached version. Otherwise the cached version is reset to -1 together with
 * the cached suid (when suid > 0 and it matches) or the cached uid (when
 * suid == 0 and uid matches). The schema object itself is not freed here.
 */
void tsdbCacheInvalidateSchema(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, int32_t sver) {
  SRocksCache *pRCache = &pTsdb->rCache;

  if (pRCache->pTSchema == NULL) {
    return;
  }
  if (sver <= pRCache->sver) {
    return;
  }

  if (suid > 0) {
    if (suid == pRCache->suid) {
      pRCache->sver = -1;
      pRCache->suid = -1;
    }
  } else if (suid == 0) {
    if (uid == pRCache->uid) {
      pRCache->sver = -1;
      pRCache->uid = -1;
    }
  }
}
577

578
/*
 * Make pTsdb->rCache.pTSchema the schema of (suid, uid) at version `sver`.
 *
 * The cached schema is reused when it was loaded for the same version and the
 * same super table (suid > 0) or the same table (suid == 0). Otherwise the old
 * schema is destroyed and a new one is fetched with metaGetTbTSchemaEx().
 *
 * Returns 0 on a cache hit, otherwise the result of metaGetTbTSchemaEx().
 */
static int32_t tsdbUpdateSkm(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, int32_t sver) {
  SRocksCache *pRCache = &pTsdb->rCache;
  if (pRCache->pTSchema && sver == pRCache->sver) {
    if (suid > 0 && suid == pRCache->suid) {
      return 0;
    }
    if (suid == 0 && uid == pRCache->uid) {
      return 0;
    }
  }

  pRCache->suid = suid;
  pRCache->uid = uid;
  pRCache->sver = sver;
  tDestroyTSchema(pRCache->pTSchema);
  // Clear the pointer before refetching: should the fetch fail without storing
  // a result, a stale pointer to the destroyed schema would otherwise pass the
  // cache-hit test above on the next call and be freed again on close.
  pRCache->pTSchema = NULL;
  return metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, sver, &pRCache->pTSchema);
}
595

596
static int32_t tsdbCacheUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, SArray *updCtxArray);
597

598
/*
 * Feed the last/last_row cache with the rows of table (suid, uid) held in `imem`.
 *
 * Steps:
 *   1. Load the table's tomb data and, when there is any, build a delete skyline.
 *   2. Take the first non-deleted row. Each of its columns yields a
 *      LFLAG_LAST_ROW update; a column that carries a value also yields a
 *      LFLAG_LAST update, while the ids of the remaining columns are collected
 *      in a hash.
 *   3. Walk the following rows until the hash is empty; a collected column that
 *      carries a value in such a row yields a LFLAG_LAST update and is removed
 *      from the hash.
 *   4. Pass the collected updates (pTsdb->rCache.ctxArray) to tsdbCacheUpdate().
 *
 * The context array is cleared again before returning. Returns 0 on success
 * (including "no row found") or the first error code encountered.
 */
int32_t tsdbLoadFromImem(SMemTable *imem, int64_t suid, int64_t uid) {
  int32_t      code = 0;
  int32_t      lino = 0;
  STsdb       *pTsdb = imem->pTsdb;
  SArray      *pDelList = NULL;
  SArray      *pSkyline = NULL;
  int64_t      iSkyline = 0;
  STbDataIter  tbIter = {0};
  TSDBROW     *pRow = NULL;
  STSchema    *pSchema = NULL;
  SSHashObj   *pNullCols = NULL;  // ids of columns still lacking a "last" value
  int32_t      sver = 0;
  int32_t      nCol = 0;
  SArray      *pCtxList = pTsdb->rCache.ctxArray;
  STsdbRowKey  firstKey = {0};
  STSDBRowIter rowIter = {0};

  STbData *pTbData = tsdbGetTbDataFromMemTable(imem, suid, uid);

  // load imem tomb data and build skyline
  TAOS_CHECK_GOTO(loadMemTombData(&pDelList, NULL, pTbData, INT64_MAX), &lino, _exit);

  size_t nDel = TARRAY_SIZE(pDelList);
  if (nDel > 0) {
    pSkyline = taosArrayInit(32, sizeof(TSDBKEY));
    if (!pSkyline) {
      TAOS_CHECK_EXIT(terrno);
    }

    TAOS_CHECK_EXIT(tsdbBuildDeleteSkyline(pDelList, 0, (int32_t)(nDel - 1), pSkyline));
    iSkyline = taosArrayGetSize(pSkyline) - 1;
  }

  pRow = tsdbImemGetFirstRow(imem, pTbData, &tbIter, pSkyline, &iSkyline);
  if (!pRow) {
    goto _exit;
  }

  // first row: last_row values for every column, last values where present
  sver = TSDBROW_SVERSION(pRow);
  TAOS_CHECK_GOTO(tsdbUpdateSkm(pTsdb, suid, uid, sver), &lino, _exit);
  pSchema = pTsdb->rCache.pTSchema;
  nCol = pSchema->numOfCols;

  tsdbRowGetKey(pRow, &firstKey);

  TAOS_CHECK_EXIT(tsdbRowIterOpen(&rowIter, pRow, pSchema));

  int32_t  iCol = 0;
  SColVal *pColVal = tsdbRowIterNext(&rowIter);
  while (pColVal && iCol < nCol) {
    SLastUpdateCtx updateCtx = {.lflag = LFLAG_LAST_ROW, .tsdbRowKey = firstKey, .colVal = *pColVal};
    if (!taosArrayPush(pCtxList, &updateCtx)) {
      TAOS_CHECK_EXIT(terrno);
    }

    if (COL_VAL_IS_VALUE(pColVal)) {
      updateCtx.lflag = LFLAG_LAST;
      if (!taosArrayPush(pCtxList, &updateCtx)) {
        TAOS_CHECK_EXIT(terrno);
      }
    } else {
      // remember the column so that older rows can supply its last value
      if (!pNullCols) {
        pNullCols = tSimpleHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT));
        if (pNullCols == NULL) {
          TAOS_CHECK_EXIT(terrno);
        }
      }

      if (tSimpleHashPut(pNullCols, &pColVal->cid, sizeof(pColVal->cid), &pColVal->cid, sizeof(pColVal->cid))) {
        TAOS_CHECK_EXIT(terrno);
      }
    }

    pColVal = tsdbRowIterNext(&rowIter);
    iCol++;
  }
  tsdbRowClose(&rowIter);

  // following rows: fill in last values for the remembered columns
  pRow = tsdbImemGetNextRow(&tbIter, pSkyline, &iSkyline);
  while (pRow && tSimpleHashGetSize(pNullCols) != 0) {
    sver = TSDBROW_SVERSION(pRow);
    TAOS_CHECK_EXIT(tsdbUpdateSkm(pTsdb, suid, uid, sver));
    pSchema = pTsdb->rCache.pTSchema;

    STsdbRowKey rowKey = {0};
    tsdbRowGetKey(pRow, &rowKey);

    TAOS_CHECK_EXIT(tsdbRowIterOpen(&rowIter, pRow, pSchema));

    int32_t  jCol = 0;
    SColVal *pVal = tsdbRowIterNext(&rowIter);
    while (pVal && jCol < nCol) {
      if (tSimpleHashGet(pNullCols, &pVal->cid, sizeof(pVal->cid)) && COL_VAL_IS_VALUE(pVal)) {
        SLastUpdateCtx updateCtx = {.lflag = LFLAG_LAST, .tsdbRowKey = rowKey, .colVal = *pVal};
        if (!taosArrayPush(pCtxList, &updateCtx)) {
          TAOS_CHECK_EXIT(terrno);
        }

        TAOS_CHECK_EXIT(tSimpleHashRemove(pNullCols, &pVal->cid, sizeof(pVal->cid)));
      }

      pVal = tsdbRowIterNext(&rowIter);
      jCol++;
    }
    tsdbRowClose(&rowIter);

    pRow = tsdbImemGetNextRow(&tbIter, pSkyline, &iSkyline);
  }

  TAOS_CHECK_GOTO(tsdbCacheUpdate(pTsdb, suid, uid, pCtxList), &lino, _exit);

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));

    tsdbRowClose(&rowIter);
  }

  // the context array is shared through rCache, so only its content is dropped
  taosArrayClear(pCtxList);

  tSimpleHashCleanup(pNullCols);
  if (pDelList) {
    taosArrayDestroy(pDelList);
  }
  if (pSkyline) {
    taosArrayDestroy(pSkyline);
  }

  TAOS_RETURN(code);
}
727

728
/*
 * Push the content of pTsdb->imem into the cache by running
 * tsdbLoadFromImem() through tsdbMemTableSaveToCache().
 *
 * Returns 0 without doing anything when pTsdb or its imem is NULL, or when the
 * memtable has no rows or no table data. Otherwise returns the result of
 * tsdbMemTableSaveToCache(); the outcome is logged either way.
 */
static int32_t tsdbCacheUpdateFromIMem(STsdb *pTsdb) {
  if (pTsdb == NULL || pTsdb->imem == NULL) {
    return 0;
  }

  int32_t    code = 0;
  int32_t    lino = 0;
  SMemTable *pMem = pTsdb->imem;
  int32_t    nTables = pMem->nTbData;
  int64_t    nRows = pMem->nRow;
  int64_t    nDels = pMem->nDel;

  if (nRows == 0 || nTables == 0) {
    return 0;
  }

  TAOS_CHECK_EXIT(tsdbMemTableSaveToCache(pMem, tsdbLoadFromImem));

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));
  } else {
    tsdbInfo("vgId:%d %s done, nRow:%" PRId64 " nDel:%" PRId64, TD_VID(pTsdb->pVnode), __func__, nRows, nDels);
  }

  TAOS_RETURN(code);
}
752

753
/*
 * Persist the cache into rocksdb.
 *
 * With tsUpdateCacheBatch set, the cache is first updated from the immutable
 * memtable (tsdbCacheUpdateFromIMem); a failure there is returned right away.
 * Then, holding pTsdb->lruMutex, every dirty LRU entry is queued via
 * tsdbCacheFlushDirty(), the write batch is forced out and rocksdb is flushed.
 *
 * Returns 0 on success, the error from tsdbCacheUpdateFromIMem(), or
 * TSDB_CODE_FAILED when rocksdb_flush() reports an error.
 */
int32_t tsdbCacheCommit(STsdb *pTsdb) {
  int32_t code = 0;

  if (tsUpdateCacheBatch) {
    code = tsdbCacheUpdateFromIMem(pTsdb);
    if (code) {
      tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));

      TAOS_RETURN(code);
    }
  }

  char      *flushErr = NULL;
  SLRUCache *pLru = pTsdb->lruCache;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  taosLRUCacheApply(pLru, tsdbCacheFlushDirty, pTsdb);
  rocksMayWrite(pTsdb, true);
  rocksdb_flush(pTsdb->rCache.db, pTsdb->rCache.flushoptions, &flushErr);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  if (flushErr != NULL) {
    // reported only after the mutex has been released
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, flushErr);
    rocksdb_free(flushErr);
    code = TSDB_CODE_FAILED;
  }

  TAOS_RETURN(code);
}
791

792
/*
 * Give a variable-length SValue its own copy of the data it points to.
 *
 * Values of other types are left untouched. For nData > 0 a buffer of nData
 * bytes is allocated, filled from the current pData and stored in pData; for
 * nData == 0 pData is set to NULL. The previous buffer is not freed.
 *
 * Returns TSDB_CODE_SUCCESS, or terrno when allocation fails (pData is then
 * unchanged).
 */
static int32_t reallocVarDataVal(SValue *pValue) {
  if (!IS_VAR_DATA_TYPE(pValue->type)) {
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  uint32_t nBytes = pValue->nData;
  if (nBytes == 0) {
    pValue->pData = NULL;
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  uint8_t *pSrc = pValue->pData;
  uint8_t *pCopy = taosMemoryMalloc(nBytes);
  if (!pCopy) {
    TAOS_RETURN(terrno);
  }

  pValue->pData = pCopy;
  (void)memcpy(pValue->pData, pSrc, nBytes);

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
810

811
// Same as reallocVarDataVal(), applied to the value carried by a column value.
static int32_t reallocVarData(SColVal *pColVal) {
  SValue *pValue = &pColVal->value;
  return reallocVarDataVal(pValue);
}
×
812

813
// realloc pk data and col data.
814
static int32_t tsdbCacheReallocSLastCol(SLastCol *pCol, size_t *pCharge) {
×
815
  int32_t code = TSDB_CODE_SUCCESS, lino = 0;
×
816
  size_t  charge = sizeof(SLastCol);
×
817

818
  int8_t i = 0;
×
819
  for (; i < pCol->rowKey.numOfPKs; i++) {
×
820
    SValue *pValue = &pCol->rowKey.pks[i];
×
821
    if (IS_VAR_DATA_TYPE(pValue->type)) {
×
822
      TAOS_CHECK_EXIT(reallocVarDataVal(pValue));
×
823
      charge += pValue->nData;
×
824
    }
825
  }
826

827
  if (IS_VAR_DATA_TYPE(pCol->colVal.value.type)) {
×
828
    TAOS_CHECK_EXIT(reallocVarData(&pCol->colVal));
×
829
    charge += pCol->colVal.value.nData;
×
830
  }
831

832
  if (pCharge) {
×
833
    *pCharge = charge;
×
834
  }
835

836
_exit:
×
837
  if (TSDB_CODE_SUCCESS != code) {
×
838
    for (int8_t j = 0; j < i; j++) {
×
839
      if (IS_VAR_DATA_TYPE(pCol->rowKey.pks[j].type)) {
×
840
        taosMemoryFree(pCol->rowKey.pks[j].pData);
×
841
      }
842
    }
843

844
    (void)memset(pCol, 0, sizeof(SLastCol));
×
845
  }
846

847
  TAOS_RETURN(code);
×
848
}
849

850
void tsdbCacheFreeSLastColItem(void *pItem) {
×
851
  SLastCol *pCol = (SLastCol *)pItem;
×
852
  for (int i = 0; i < pCol->rowKey.numOfPKs; i++) {
×
853
    if (IS_VAR_DATA_TYPE(pCol->rowKey.pks[i].type)) {
×
854
      taosMemoryFree(pCol->rowKey.pks[i].pData);
×
855
    }
856
  }
857

858
  if (IS_VAR_DATA_TYPE(pCol->colVal.value.type) && pCol->colVal.value.pData) {
×
859
    taosMemoryFree(pCol->colVal.value.pData);
×
860
  }
861
}
×
862

863
static void tsdbCacheDeleter(const void *key, size_t klen, void *value, void *ud) {
×
864
  SLastCol *pLastCol = (SLastCol *)value;
×
865

866
  if (pLastCol->dirty) {
×
867
    if (tsdbCacheFlushDirty(key, klen, pLastCol, ud) != 0) {
×
868
      STsdb *pTsdb = (STsdb *)ud;
×
869
      tsdbTrace("tsdb/cache: vgId:%d, flush cache %s failed at line %d.", TD_VID(pTsdb->pVnode), __func__, __LINE__);
×
870
    }
871
  }
872

873
  for (uint8_t i = 0; i < pLastCol->rowKey.numOfPKs; ++i) {
×
874
    SValue *pValue = &pLastCol->rowKey.pks[i];
×
875
    if (IS_VAR_DATA_TYPE(pValue->type)) {
×
876
      taosMemoryFree(pValue->pData);
×
877
    }
878
  }
879

880
  if (IS_VAR_DATA_TYPE(pLastCol->colVal.value.type) /* && pLastCol->colVal.value.nData > 0*/) {
×
881
    taosMemoryFree(pLastCol->colVal.value.pData);
×
882
  }
883

884
  taosMemoryFree(value);
×
885
}
×
886

887
static void tsdbCacheOverWriter(const void *key, size_t klen, void *value, void *ud) {
×
888
  SLastCol *pLastCol = (SLastCol *)value;
×
889
  pLastCol->dirty = 0;
×
890
}
×
891

892
static int32_t tsdbCachePutToLRU(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol, int8_t dirty);
893

894
/*
 * Insert a placeholder entry for column (uid, cid) into the LRU cache.
 *
 * The entry carries row key ts = TSKEY_MIN with no primary keys, a NONE
 * column value of type col_type, and is stored dirty with status
 * TSDB_LAST_CACHE_VALID. lflag becomes the lflag field of the cache key.
 *
 * Returns the result of tsdbCachePutToLRU; a failure is logged.
 */
static int32_t tsdbCacheNewTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, int8_t col_type, int8_t lflag) {
  SLastCol noneCol = {
      .rowKey = (SRowKey){.ts = TSKEY_MIN, .numOfPKs = 0},
      .colVal = COL_VAL_NONE(cid, col_type),
      .dirty = 1,
      .cacheStatus = TSDB_LAST_CACHE_VALID,
  };

  int32_t code = tsdbCachePutToLRU(pTsdb, &(SLastKey){.lflag = lflag, .uid = uid, .cid = cid}, &noneCol, 1);
  if (code != 0) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
  }

  TAOS_RETURN(code);
}
911

912
/*
 * Push cached state down to RocksDB without taking lruMutex; the callers in
 * this file lock pTsdb->lruMutex before invoking it.
 *
 * Steps: apply tsdbCacheFlushDirty to every LRU entry, force the pending
 * write batch out via rocksMayWrite(pTsdb, true), then call rocksdb_flush.
 *
 * Returns 0, or TSDB_CODE_FAILED when rocksdb_flush reports an error (the
 * error text is logged and released).
 */
int32_t tsdbCacheCommitNoLock(STsdb *pTsdb) {
  int32_t code = 0;
  char   *flushErr = NULL;

  taosLRUCacheApply(pTsdb->lruCache, tsdbCacheFlushDirty, pTsdb);

  rocksMayWrite(pTsdb, true);
  rocksdb_flush(pTsdb->rCache.db, pTsdb->rCache.flushoptions, &flushErr);

  if (flushErr != NULL) {
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, flushErr);
    rocksdb_free(flushErr);
    code = TSDB_CODE_FAILED;
  }

  TAOS_RETURN(code);
}
932

933
/*
 * Fetch numKeys values from RocksDB with a single rocksdb_multi_get call.
 *
 * ppKeysList / pKeysListSizes  keys and their lengths (numKeys entries each)
 * pppValuesList                out: newly allocated array of numKeys value
 *                              pointers; an entry is left NULL when RocksDB
 *                              did not store a value for that key
 * ppValuesListSizes            out: newly allocated array of value lengths
 *
 * On success the caller owns both output arrays (taosMemoryFree) and every
 * non-NULL value (rocksdb_free). The outputs are not touched on failure.
 *
 * Per-key errors reported by RocksDB do not fail the call; they are logged
 * so that a read error is not silently mistaken for a missing key.
 *
 * Returns TSDB_CODE_SUCCESS, or terrno when an allocation fails.
 */
static int32_t tsdbCacheGetValuesFromRocks(STsdb *pTsdb, size_t numKeys, const char *const *ppKeysList,
                                           size_t *pKeysListSizes, char ***pppValuesList, size_t **ppValuesListSizes) {
  int32_t code = 0;

  char **valuesList = taosMemoryCalloc(numKeys, sizeof(char *));
  if (!valuesList) return terrno;

  size_t *valuesListSizes = taosMemoryCalloc(numKeys, sizeof(size_t));
  if (!valuesListSizes) {
    code = terrno;  // capture before the cleanup calls below
    taosMemoryFreeClear(valuesList);
    return code;
  }

  char **errs = taosMemoryCalloc(numKeys, sizeof(char *));
  if (!errs) {
    code = terrno;  // capture before the cleanup calls below
    taosMemoryFreeClear(valuesList);
    taosMemoryFreeClear(valuesListSizes);
    return code;
  }

  rocksdb_multi_get(pTsdb->rCache.db, pTsdb->rCache.readoptions, numKeys, ppKeysList, pKeysListSizes, valuesList,
                    valuesListSizes, errs);

  for (size_t i = 0; i < numKeys; ++i) {
    if (errs[i] == NULL) {
      continue;
    }
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, errs[i]);
    rocksdb_free(errs[i]);
  }
  taosMemoryFreeClear(errs);

  *pppValuesList = valuesList;
  *ppValuesListSizes = valuesListSizes;
  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
959

960
/*
 * Remove the LFLAG_LAST and LFLAG_LAST_ROW cache entries of column
 * (uid, cid) from both RocksDB and the LRU cache.
 *
 * The two keys are looked up in RocksDB; every key whose stored value
 * deserializes to an entry gets a delete queued on the shared write batch
 * (the batch itself is written by the caller). Both keys are then erased
 * from the LRU cache.
 *
 * hasPrimaryKey is currently not used by this function.
 *
 * Returns 0 on success, terrno on allocation failure, or the error from
 * tsdbCacheGetValuesFromRocks / tsdbCacheDeserialize. All temporary
 * buffers, including the values returned by RocksDB, are released on every
 * path.
 */
static int32_t tsdbCacheDropTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, bool hasPrimaryKey) {
  int32_t code = 0;

  // build keys & multi get from rocks
  char **keys_list = taosMemoryCalloc(2, sizeof(char *));
  if (!keys_list) {
    return terrno;
  }
  size_t *keys_list_sizes = taosMemoryCalloc(2, sizeof(size_t));
  if (!keys_list_sizes) {
    code = terrno;  // capture before the cleanup call below
    taosMemoryFree(keys_list);
    return code;
  }
  const size_t klen = ROCKS_KEY_LEN;

  // one buffer holds both keys; keys_list[] points into it
  char *keys = taosMemoryCalloc(2, sizeof(SLastKey));
  if (!keys) {
    code = terrno;  // capture before the cleanup calls below
    taosMemoryFree(keys_list);
    taosMemoryFree(keys_list_sizes);
    return code;
  }
  ((SLastKey *)keys)[0] = (SLastKey){.lflag = LFLAG_LAST, .uid = uid, .cid = cid};
  ((SLastKey *)keys)[1] = (SLastKey){.lflag = LFLAG_LAST_ROW, .uid = uid, .cid = cid};

  keys_list[0] = keys;
  keys_list[1] = keys + sizeof(SLastKey);
  keys_list_sizes[0] = klen;
  keys_list_sizes[1] = klen;

  char                **values_list = NULL;
  size_t               *values_list_sizes = NULL;
  rocksdb_writebatch_t *wb = pTsdb->rCache.writebatch;

  // the write batch was already flushed by the caller
  TAOS_CHECK_GOTO(tsdbCacheGetValuesFromRocks(pTsdb, 2, (const char *const *)keys_list, keys_list_sizes, &values_list,
                                              &values_list_sizes),
                  NULL, _exit);

  for (int i = 0; i < 2; i++) {
    if (values_list[i] == NULL) {
      continue;
    }

    SLastCol *pLastCol = NULL;
    code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
    if (code != TSDB_CODE_SUCCESS) {
      tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(code));
      goto _exit;
    }
    if (NULL != pLastCol) {
      rocksdb_writebatch_delete(wb, keys_list[i], klen);
    }
    taosMemoryFreeClear(pLastCol);
  }

  for (int i = 0; i < 2; i++) {
    LRUHandle *h = taosLRUCacheLookup(pTsdb->lruCache, keys_list[i], klen);
    if (h) {
      tsdbLRUCacheRelease(pTsdb->lruCache, h, true);
      taosLRUCacheErase(pTsdb->lruCache, keys_list[i], klen);
    }
  }

_exit:
  // values returned by RocksDB must be released on the error paths as well
  if (values_list) {
    rocksdb_free(values_list[0]);
    rocksdb_free(values_list[1]);
  }

  taosMemoryFree(keys);
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  taosMemoryFree(values_list);
  taosMemoryFree(values_list_sizes);

  TAOS_RETURN(code);
}
1051

1052
/*
 * Create placeholder LAST_ROW and LAST cache entries for every column of a
 * new table, under lruMutex.
 *
 * When suid < 0 the columns are taken from pSchemaRow; otherwise the schema
 * is fetched with metaGetTbTSchemaEx(suid, uid, -1) and freed before
 * returning. A failure for an individual column is traced and the loop
 * continues.
 *
 * Returns the metaGetTbTSchemaEx error if the schema cannot be loaded,
 * otherwise the result of the last tsdbCacheNewTableColumn call.
 */
int32_t tsdbCacheNewTable(STsdb *pTsdb, tb_uid_t uid, tb_uid_t suid, const SSchemaWrapper *pSchemaRow) {
  int32_t      code = 0;
  STSchema    *pTSchema = NULL;
  const bool   useSchemaRow = (suid < 0);
  const int8_t lflags[2] = {LFLAG_LAST_ROW, LFLAG_LAST};

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  if (!useSchemaRow) {
    code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, -1, &pTSchema);
    if (code != TSDB_CODE_SUCCESS) {
      (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

      TAOS_RETURN(code);
    }
  }

  const int nCols = useSchemaRow ? pSchemaRow->nCols : pTSchema->numOfCols;
  for (int iCol = 0; iCol < nCols; ++iCol) {
    int16_t cid;
    int8_t  col_type;
    if (useSchemaRow) {
      cid = pSchemaRow->pSchema[iCol].colId;
      col_type = pSchemaRow->pSchema[iCol].type;
    } else {
      cid = pTSchema->columns[iCol].colId;
      col_type = pTSchema->columns[iCol].type;
    }

    // LAST_ROW entry first, then LAST
    for (int k = 0; k < 2; ++k) {
      code = tsdbCacheNewTableColumn(pTsdb, uid, cid, col_type, lflags[k]);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbTrace("vgId:%d, %s new table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
      }
    }
  }

  if (!useSchemaRow) {
    taosMemoryFree(pTSchema);
  }

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1105

1106
/*
 * Drop the cache entries of every column of table uid, under lruMutex.
 *
 * The cache is committed first (a commit failure is only traced). Columns
 * come from pSchemaRow when it is non-NULL, otherwise from the schema loaded
 * with metaGetTbTSchemaEx(suid, uid, -1). The second column's COL_IS_KEY
 * flag decides the hasPrimaryKey argument passed to
 * tsdbCacheDropTableColumn. Per-column failures are traced and skipped.
 * rocksMayWrite(pTsdb, false) is called before unlocking.
 *
 * Returns the metaGetTbTSchemaEx error if the schema cannot be loaded,
 * otherwise the result of the last tsdbCacheDropTableColumn call.
 */
int32_t tsdbCacheDropTable(STsdb *pTsdb, tb_uid_t uid, tb_uid_t suid, SSchemaWrapper *pSchemaRow) {
  int32_t   code = 0;
  STSchema *pTSchema = NULL;
  bool      hasPrimayKey = false;
  int       nCols = 0;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  code = tsdbCacheCommitNoLock(pTsdb);
  if (code != TSDB_CODE_SUCCESS) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  if (pSchemaRow != NULL) {
    nCols = pSchemaRow->nCols;
    if (nCols >= 2) {
      hasPrimayKey = (pSchemaRow->pSchema[1].flags & COL_IS_KEY) ? true : false;
    }
  } else {
    code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, -1, &pTSchema);
    if (code != TSDB_CODE_SUCCESS) {
      (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

      TAOS_RETURN(code);
    }

    nCols = pTSchema->numOfCols;
    if (nCols >= 2) {
      hasPrimayKey = (pTSchema->columns[1].flags & COL_IS_KEY) ? true : false;
    }
  }

  for (int iCol = 0; iCol < nCols; ++iCol) {
    int16_t cid = (pSchemaRow != NULL) ? pSchemaRow->pSchema[iCol].colId : pTSchema->columns[iCol].colId;

    code = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
    if (code != TSDB_CODE_SUCCESS) {
      tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(code));
    }
  }

  if (pSchemaRow == NULL) {
    taosMemoryFree(pTSchema);
  }

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1167

1168
/*
 * Drop the cache entries of every column for each table uid in uids, using
 * the schema loaded with metaGetTbTSchemaEx(suid, suid, -1). Runs under
 * lruMutex.
 *
 * The cache is committed first (a commit failure is only traced).
 * Per-column failures are traced and skipped. rocksMayWrite(pTsdb, false)
 * is called before unlocking.
 *
 * Returns the metaGetTbTSchemaEx error if the schema cannot be loaded,
 * otherwise the result of the last tsdbCacheDropTableColumn call.
 */
int32_t tsdbCacheDropSubTables(STsdb *pTsdb, SArray *uids, tb_uid_t suid) {
  int32_t   code = 0;
  STSchema *pTSchema = NULL;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  code = tsdbCacheCommitNoLock(pTsdb);
  if (code != TSDB_CODE_SUCCESS) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  code = metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, suid, -1, &pTSchema);
  if (code != TSDB_CODE_SUCCESS) {
    (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

    TAOS_RETURN(code);
  }

  for (int iTb = 0; iTb < TARRAY_SIZE(uids); ++iTb) {
    int64_t uid = ((tb_uid_t *)TARRAY_DATA(uids))[iTb];
    int     nCols = pTSchema->numOfCols;
    bool    hasPrimayKey = false;

    if (nCols >= 2) {
      hasPrimayKey = (pTSchema->columns[1].flags & COL_IS_KEY) ? true : false;
    }

    for (int iCol = 0; iCol < nCols; ++iCol) {
      int16_t cid = pTSchema->columns[iCol].colId;

      code = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
      }
    }
  }

  taosMemoryFree(pTSchema);

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1216

1217
/*
 * Create placeholder cache entries for a new column (uid, cid), under
 * lruMutex: tsdbCacheNewTableColumn is called with lflag 0 and then with
 * lflag 1. A failure is traced and does not stop the second call.
 *
 * Returns the result of the lflag == 1 call.
 */
int32_t tsdbCacheNewNTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, int8_t col_type) {
  int32_t code = 0;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  for (int8_t lflag = 0; lflag <= 1; ++lflag) {
    code = tsdbCacheNewTableColumn(pTsdb, uid, cid, col_type, lflag);
    if (code == TSDB_CODE_SUCCESS) {
      continue;
    }
    tsdbTrace("vgId:%d, %s new table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1237

1238
/*
 * Drop the cache entries of column (uid, cid), under lruMutex.
 *
 * The cache is committed first, then tsdbCacheDropTableColumn is called and
 * rocksMayWrite(pTsdb, false) follows. Failures of the commit or the drop
 * are only traced.
 *
 * Returns the result of tsdbCacheDropTableColumn.
 */
int32_t tsdbCacheDropNTableColumn(STsdb *pTsdb, int64_t uid, int16_t cid, bool hasPrimayKey) {
  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  int32_t code = tsdbCacheCommitNoLock(pTsdb);
  if (TSDB_CODE_SUCCESS != code) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  code = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
  if (TSDB_CODE_SUCCESS != code) {
    tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1261

1262
/*
 * Create placeholder cache entries for a new column cid on every table in
 * uids, under lruMutex. For each uid tsdbCacheNewTableColumn is called with
 * lflag 0 and then with lflag 1; failures are traced and skipped.
 *
 * Returns 0 when uids is empty, otherwise the result of the last
 * tsdbCacheNewTableColumn call.
 */
int32_t tsdbCacheNewSTableColumn(STsdb *pTsdb, SArray *uids, int16_t cid, int8_t col_type) {
  int32_t code = 0;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  for (int iTb = 0; iTb < TARRAY_SIZE(uids); ++iTb) {
    tb_uid_t uid = ((tb_uid_t *)TARRAY_DATA(uids))[iTb];

    for (int8_t lflag = 0; lflag <= 1; ++lflag) {
      code = tsdbCacheNewTableColumn(pTsdb, uid, cid, col_type, lflag);
      if (code == TSDB_CODE_SUCCESS) {
        continue;
      }
      tsdbTrace("vgId:%d, %s new table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(code));
    }
  }

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
  TAOS_RETURN(code);
}
1286

1287
/*
 * Drop the cache entries of column cid for every table in uids, under
 * lruMutex.
 *
 * The cache is committed first (a commit failure is only traced), each
 * table is handled by tsdbCacheDropTableColumn (failures traced and
 * skipped), and rocksMayWrite(pTsdb, false) is called before unlocking.
 *
 * Returns the commit result when uids is empty, otherwise the result of the
 * last tsdbCacheDropTableColumn call.
 */
int32_t tsdbCacheDropSTableColumn(STsdb *pTsdb, SArray *uids, int16_t cid, bool hasPrimayKey) {
  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  int32_t code = tsdbCacheCommitNoLock(pTsdb);
  if (TSDB_CODE_SUCCESS != code) {
    tsdbTrace("vgId:%d, %s commit with no lock failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
              tstrerror(code));
  }

  for (int iTb = 0; iTb < TARRAY_SIZE(uids); ++iTb) {
    int64_t uid = ((tb_uid_t *)TARRAY_DATA(uids))[iTb];

    code = tsdbCacheDropTableColumn(pTsdb, uid, cid, hasPrimayKey);
    if (TSDB_CODE_SUCCESS != code) {
      tsdbTrace("vgId:%d, %s drop table column failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                tstrerror(code));
    }
  }

  rocksMayWrite(pTsdb, false);

  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  TAOS_RETURN(code);
}
1314

1315
typedef struct {
1316
  int      idx;
1317
  SLastKey key;
1318
} SIdxKey;
1319

1320
/*
 * Reset a cached column to the "no value" state.
 *
 * The row key becomes ts = TSKEY_MIN with zero primary keys, and the column
 * value becomes COL_VAL_NONE with the same cid and type. Buffers of
 * variable-length values with nData > 0 are freed. The entry is marked
 * dirty and its cacheStatus is set to the given value.
 */
static void tsdbCacheUpdateLastColToNone(SLastCol *pLastCol, ELastCacheStatus cacheStatus) {
  SRowKey *pRowKey = &pLastCol->rowKey;
  SValue  *pVal = &pLastCol->colVal.value;

  // row key
  pRowKey->ts = TSKEY_MIN;
  for (int8_t iPk = 0; iPk < pRowKey->numOfPKs; iPk++) {
    SValue *pPk = &pRowKey->pks[iPk];
    if (!(IS_VAR_DATA_TYPE(pPk->type) && pPk->nData > 0)) {
      pPk->val = 0;
      continue;
    }
    taosMemoryFreeClear(pPk->pData);
    pPk->nData = 0;
  }
  pRowKey->numOfPKs = 0;

  // column value
  if (!(IS_VAR_DATA_TYPE(pVal->type) && pVal->nData > 0)) {
    pVal->val = 0;
  } else {
    taosMemoryFreeClear(pVal->pData);
    pVal->nData = 0;
  }

  pLastCol->colVal = COL_VAL_NONE(pLastCol->colVal.cid, pLastCol->colVal.value.type);
  pLastCol->dirty = 1;
  pLastCol->cacheStatus = cacheStatus;
}
×
1346

1347
/*
 * Serialize pLastCol and queue it on the shared RocksDB write batch under
 * key pLastKey (ROCKS_KEY_LEN bytes). The batch is modified while holding
 * rCache.writeBatchMutex; the serialized buffer is freed afterwards.
 *
 * Returns 0, or the tsdbCacheSerialize error (logged).
 */
static int32_t tsdbCachePutToRocksdb(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol) {
  char  *serialized = NULL;
  size_t serializedLen = 0;

  int32_t code = tsdbCacheSerialize(pLastCol, &serialized, &serializedLen);
  if (code != 0) {
    tsdbError("tsdb/cache/putrocks: vgId:%d, serialize failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
    TAOS_RETURN(code);
  }

  rocksdb_writebatch_t *pBatch = pTsdb->rCache.writebatch;

  (void)taosThreadMutexLock(&pTsdb->rCache.writeBatchMutex);
  rocksdb_writebatch_put(pBatch, (char *)pLastKey, ROCKS_KEY_LEN, serialized, serializedLen);
  (void)taosThreadMutexUnlock(&pTsdb->rCache.writeBatchMutex);

  taosMemoryFree(serialized);

  TAOS_RETURN(code);
}
1367

1368
/*
 * Insert a copy of *pLastCol into the LRU cache under key pLastKey.
 *
 * A heap copy is made, its dirty flag is set to the dirty argument, and
 * tsdbCacheReallocSLastCol is applied to it (which also yields the charge
 * passed to the cache). The copy is inserted with tsdbCacheDeleter and
 * tsdbCacheOverWriter as callbacks.
 *
 * Returns 0 on success, terrno if the copy cannot be allocated, the
 * tsdbCacheReallocSLastCol error, or TSDB_CODE_FAILED when the cache reports
 * a status other than OK / OK_OVERWRITTEN. In the last case the copy is not
 * freed here.
 */
static int32_t tsdbCachePutToLRU(STsdb *pTsdb, SLastKey *pLastKey, SLastCol *pLastCol, int8_t dirty) {
  int32_t   code = 0, lino = 0;
  size_t    charge = 0;
  LRUStatus status;

  SLastCol *pCopy = taosMemoryCalloc(1, sizeof(SLastCol));
  if (pCopy == NULL) {
    return terrno;
  }

  *pCopy = *pLastCol;
  pCopy->dirty = dirty;
  TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(pCopy, &charge));

  status = taosLRUCacheInsert(pTsdb->lruCache, pLastKey, ROCKS_KEY_LEN, pCopy, charge, tsdbCacheDeleter,
                              tsdbCacheOverWriter, NULL, TAOS_LRU_PRIORITY_LOW, pTsdb);
  if (!(status == TAOS_LRU_STATUS_OK || status == TAOS_LRU_STATUS_OK_OVERWRITTEN)) {
    tsdbError("vgId:%d, %s failed at line %d status %d.", TD_VID(pTsdb->pVnode), __func__, __LINE__, status);
    code = TSDB_CODE_FAILED;
    pCopy = NULL;  // keeps the cleanup below from freeing the copy
  }

_exit:
  if (code != TSDB_CODE_SUCCESS) {
    taosMemoryFree(pCopy);
    tsdbError("tsdb/cache/putlru: vgId:%d, failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));
  }

  TAOS_RETURN(code);
}
1397

1398
/*
 * Apply a batch of last / last_row updates for table uid to the cache.
 *
 * updCtxArray holds SLastUpdateCtx elements. The whole operation runs under
 * lruMutex, in two passes:
 *
 *   1. Entries already present in the LRU cache are replaced (dirty) when
 *      the new row key is greater than the cached one, or equal with a
 *      column value that is not NONE. Entries whose cached status is
 *      TSDB_LAST_CACHE_NO_CACHE are left alone. Keys missing from the LRU
 *      cache are collected in remainCols.
 *   2. The collected keys are read from RocksDB after forcing the pending
 *      write batch out. A stored entry with status NO_CACHE is copied into
 *      the LRU cache unchanged; otherwise the update is written to both
 *      RocksDB and the LRU cache (clean) when there is no stored entry or
 *      the same row-key rule as in pass 1 holds.
 *
 * LFLAG_LAST updates whose column value is not a real value are skipped in
 * both passes. suid is not used.
 *
 * Every temporary buffer, including the values returned by RocksDB, is
 * released at _exit, so all failure paths leave through that label.
 *
 * Returns 0 on success or the first error encountered.
 */
static int32_t tsdbCacheUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, SArray *updCtxArray) {
  if (!updCtxArray || TARRAY_SIZE(updCtxArray) == 0) {
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  int32_t code = 0, lino = 0;

  int        num_keys = TARRAY_SIZE(updCtxArray);
  SArray    *remainCols = NULL;
  SLRUCache *pCache = pTsdb->lruCache;

  // declared before the first goto so that _exit can always release them
  char  **keys_list = NULL;
  size_t *keys_list_sizes = NULL;
  char  **values_list = NULL;
  size_t *values_list_sizes = NULL;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  // pass 1: entries that are already in the LRU cache
  for (int i = 0; i < num_keys; ++i) {
    SLastUpdateCtx *updCtx = &((SLastUpdateCtx *)TARRAY_DATA(updCtxArray))[i];
    int8_t          lflag = updCtx->lflag;
    SRowKey        *pRowKey = &updCtx->tsdbRowKey.key;
    SColVal        *pColVal = &updCtx->colVal;

    if (lflag == LFLAG_LAST && !COL_VAL_IS_VALUE(pColVal)) {
      continue;
    }

    SLastKey  *key = &(SLastKey){.lflag = lflag, .uid = uid, .cid = pColVal->cid};
    LRUHandle *h = taosLRUCacheLookup(pCache, key, ROCKS_KEY_LEN);
    if (h) {
      SLastCol *pLastCol = (SLastCol *)taosLRUCacheValue(pCache, h);
      if (pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
        int32_t cmp_res = tRowKeyCompare(&pLastCol->rowKey, pRowKey);
        if (cmp_res < 0 || (cmp_res == 0 && !COL_VAL_IS_NONE(pColVal))) {
          SLastCol newLastCol = {
              .rowKey = *pRowKey, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
          code = tsdbCachePutToLRU(pTsdb, key, &newLastCol, 1);
        }
      }

      tsdbLRUCacheRelease(pCache, h, false);
      TAOS_CHECK_EXIT(code);
    } else {
      if (!remainCols) {
        remainCols = taosArrayInit(num_keys * 2, sizeof(SIdxKey));
        if (!remainCols) {
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
        }
      }
      if (!taosArrayPush(remainCols, &(SIdxKey){i, *key})) {
        TAOS_CHECK_GOTO(terrno, &lino, _exit);
      }
    }
  }

  if (remainCols) {
    num_keys = TARRAY_SIZE(remainCols);
  }

  // pass 2: entries that have to be looked up in RocksDB
  if (remainCols && num_keys > 0) {
    keys_list = taosMemoryCalloc(num_keys, sizeof(char *));
    if (!keys_list) {
      code = terrno;
      lino = __LINE__;
      goto _exit;
    }
    keys_list_sizes = taosMemoryCalloc(num_keys, sizeof(size_t));
    if (!keys_list_sizes) {
      code = terrno;
      lino = __LINE__;
      goto _exit;
    }
    for (int i = 0; i < num_keys; ++i) {
      SIdxKey *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[i];

      keys_list[i] = (char *)&idxKey->key;
      keys_list_sizes[i] = ROCKS_KEY_LEN;
    }

    rocksMayWrite(pTsdb, true);  // flush writebatch cache

    TAOS_CHECK_GOTO(tsdbCacheGetValuesFromRocks(pTsdb, num_keys, (const char *const *)keys_list, keys_list_sizes,
                                                &values_list, &values_list_sizes),
                    &lino, _exit);

    for (int i = 0; i < num_keys; ++i) {
      SIdxKey        *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[i];
      SLastUpdateCtx *updCtx = (SLastUpdateCtx *)taosArrayGet(updCtxArray, idxKey->idx);
      SRowKey        *pRowKey = &updCtx->tsdbRowKey.key;
      SColVal        *pColVal = &updCtx->colVal;

      SLastCol *pLastCol = NULL;
      if (values_list[i] != NULL) {
        code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
        if (code != TSDB_CODE_SUCCESS) {
          lino = __LINE__;
          tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, lino,
                    tstrerror(code));
          goto _exit;
        }
      }

      if (pLastCol && pLastCol->cacheStatus == TSDB_LAST_CACHE_NO_CACHE) {
        code = tsdbCachePutToLRU(pTsdb, &idxKey->key, pLastCol, 0);
        taosMemoryFreeClear(pLastCol);
        if (code != TSDB_CODE_SUCCESS) {
          lino = __LINE__;
          tsdbError("tsdb/cache: vgId:%d, put lru failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino,
                    tstrerror(code));
          break;
        }

        // cache invalid => skip update
        continue;
      }

      if (IS_LAST_KEY(idxKey->key) && !COL_VAL_IS_VALUE(pColVal)) {
        taosMemoryFreeClear(pLastCol);
        continue;
      }

      int32_t cmp_res = 1;
      if (pLastCol) {
        cmp_res = tRowKeyCompare(&pLastCol->rowKey, pRowKey);
      }

      if (NULL == pLastCol || cmp_res < 0 || (cmp_res == 0 && !COL_VAL_IS_NONE(pColVal))) {
        SLastCol lastColTmp = {
            .rowKey = *pRowKey, .colVal = *pColVal, .dirty = 0, .cacheStatus = TSDB_LAST_CACHE_VALID};
        if ((code = tsdbCachePutToRocksdb(pTsdb, &idxKey->key, &lastColTmp)) != TSDB_CODE_SUCCESS) {
          lino = __LINE__;
          tsdbError("tsdb/cache: vgId:%d, put rocks failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino,
                    tstrerror(code));
          taosMemoryFreeClear(pLastCol);
          break;
        }
        if ((code = tsdbCachePutToLRU(pTsdb, &idxKey->key, &lastColTmp, 0)) != TSDB_CODE_SUCCESS) {
          lino = __LINE__;
          tsdbError("tsdb/cache: vgId:%d, put lru failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino,
                    tstrerror(code));
          taosMemoryFreeClear(pLastCol);
          break;
        }
      }

      taosMemoryFreeClear(pLastCol);
    }

    rocksMayWrite(pTsdb, false);
  }

_exit:
  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  // keys_list[] only points into remainCols, so it carries no ownership
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  if (values_list) {
    // values_list is only set after num_keys became the remainCols size
    for (int i = 0; i < num_keys; ++i) {
      rocksdb_free(values_list[i]);
    }
    taosMemoryFree(values_list);
  }
  taosMemoryFree(values_list_sizes);
  taosArrayDestroy(remainCols);

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, update failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));
  }

  TAOS_RETURN(code);
}
1575

1576
int32_t tsdbCacheRowFormatUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, int64_t version, int32_t nRow,
×
1577
                                 SRow **aRow) {
1578
  int32_t code = 0, lino = 0;
×
1579

1580
  // 1. prepare last
1581
  TSDBROW      lRow = {.type = TSDBROW_ROW_FMT, .pTSRow = aRow[nRow - 1], .version = version};
×
1582
  STSchema    *pTSchema = NULL;
×
1583
  int32_t      sver = TSDBROW_SVERSION(&lRow);
×
1584
  SSHashObj   *iColHash = NULL;
×
1585
  STSDBRowIter iter = {0};
×
1586

1587
  TAOS_CHECK_GOTO(tsdbUpdateSkm(pTsdb, suid, uid, sver), &lino, _exit);
×
1588
  pTSchema = pTsdb->rCache.pTSchema;
×
1589

1590
  TSDBROW tRow = {.type = TSDBROW_ROW_FMT, .version = version};
×
1591
  int32_t nCol = pTSchema->numOfCols;
×
1592
  SArray *ctxArray = pTsdb->rCache.ctxArray;
×
1593

1594
  // 1. prepare by lrow
1595
  STsdbRowKey tsdbRowKey = {0};
×
1596
  tsdbRowGetKey(&lRow, &tsdbRowKey);
×
1597

1598
  TAOS_CHECK_GOTO(tsdbRowIterOpen(&iter, &lRow, pTSchema), &lino, _exit);
×
1599

1600
  int32_t iCol = 0;
×
1601
  for (SColVal *pColVal = tsdbRowIterNext(&iter); pColVal && iCol < nCol; pColVal = tsdbRowIterNext(&iter), iCol++) {
×
1602
    SLastUpdateCtx updateCtx = {.lflag = LFLAG_LAST_ROW, .tsdbRowKey = tsdbRowKey, .colVal = *pColVal};
×
1603
    if (!taosArrayPush(ctxArray, &updateCtx)) {
×
1604
      TAOS_CHECK_GOTO(terrno, &lino, _exit);
×
1605
    }
1606

1607
    if (COL_VAL_IS_VALUE(pColVal)) {
×
1608
      updateCtx.lflag = LFLAG_LAST;
×
1609
      if (!taosArrayPush(ctxArray, &updateCtx)) {
×
1610
        TAOS_CHECK_GOTO(terrno, &lino, _exit);
×
1611
      }
1612
    } else {
1613
      if (!iColHash) {
×
1614
        iColHash = tSimpleHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT));
×
1615
        if (iColHash == NULL) {
×
1616
          TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _exit);
×
1617
        }
1618
      }
1619

1620
      if (tSimpleHashPut(iColHash, &iCol, sizeof(iCol), NULL, 0)) {
×
1621
        TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _exit);
×
1622
      }
1623
    }
1624
  }
1625

1626
  // 2. prepare by the other rows
1627
  for (int32_t iRow = nRow - 2; iRow >= 0; --iRow) {
×
1628
    if (tSimpleHashGetSize(iColHash) == 0) {
×
1629
      break;
×
1630
    }
1631

1632
    tRow.pTSRow = aRow[iRow];
×
1633

1634
    STsdbRowKey tsdbRowKey = {0};
×
1635
    tsdbRowGetKey(&tRow, &tsdbRowKey);
×
1636

1637
    void   *pIte = NULL;
×
1638
    int32_t iter = 0;
×
1639
    while ((pIte = tSimpleHashIterate(iColHash, pIte, &iter)) != NULL) {
×
1640
      int32_t iCol = ((int32_t *)pIte)[0];
×
1641
      SColVal colVal = COL_VAL_NONE(0, 0);
×
1642
      tsdbRowGetColVal(&tRow, pTSchema, iCol, &colVal);
×
1643

1644
      if (COL_VAL_IS_VALUE(&colVal)) {
×
1645
        SLastUpdateCtx updateCtx = {.lflag = LFLAG_LAST, .tsdbRowKey = tsdbRowKey, .colVal = colVal};
×
1646
        if (!taosArrayPush(ctxArray, &updateCtx)) {
×
1647
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
×
1648
        }
1649
        code = tSimpleHashIterateRemove(iColHash, &iCol, sizeof(iCol), &pIte, &iter);
×
1650
        if (code != TSDB_CODE_SUCCESS) {
×
1651
          tsdbTrace("vgId:%d, %s tSimpleHashIterateRemove failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__,
×
1652
                    __LINE__, tstrerror(code));
1653
        }
1654
      }
1655
    }
1656
  }
1657

1658
  TAOS_CHECK_GOTO(tsdbCacheUpdate(pTsdb, suid, uid, ctxArray), &lino, _exit);
×
1659

1660
_exit:
×
1661
  if (code) {
×
1662
    tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
×
1663
  }
1664

1665
  tsdbRowClose(&iter);
×
1666
  tSimpleHashCleanup(iColHash);
×
1667
  taosArrayClear(ctxArray);
×
1668

1669
  TAOS_RETURN(code);
×
1670
}
1671

1672
/*
 * Update the last / last_row cache of table uid from a column-format block.
 *
 * The block's final row (index nRow - 1) is used as the last row. Queued
 * updates, in order:
 *   - LFLAG_LAST for the timestamp column, taken from the last row;
 *   - LFLAG_LAST for every column flagged HAS_VALUE, using the first row
 *     found when scanning from the end whose bit value equals 2;
 *   - LFLAG_LAST_ROW for every column of the last row.
 * The list is then applied with tsdbCacheUpdate.
 *
 * The schema is loaded with metaGetTbTSchemaEx for the last row's schema
 * version; it and the update list are released before returning.
 *
 * Returns 0 on success or the first error encountered.
 */
int32_t tsdbCacheColFormatUpdate(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, SBlockData *pBlockData) {
  int32_t      code = 0, lino = 0;
  STSDBRowIter rowIter = {0};
  STSchema    *pSchema = NULL;
  SArray      *pCtxs = NULL;
  STsdbRowKey  lastRowKey = {0};

  TSDBROW lastRow = tsdbRowFromBlockData(pBlockData, pBlockData->nRow - 1);
  TSDBROW scanRow = tsdbRowFromBlockData(pBlockData, 0);
  int32_t sver = TSDBROW_SVERSION(&lastRow);

  TAOS_CHECK_RETURN(metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, sver, &pSchema));

  pCtxs = taosArrayInit(pBlockData->nColData, sizeof(SLastUpdateCtx));
  if (pCtxs == NULL) {
    TAOS_CHECK_GOTO(terrno, &lino, _exit);
  }

  // 1. "last" updates
  tsdbRowGetKey(&lastRow, &lastRowKey);

  // timestamp column of the last row
  SLastUpdateCtx tsCtx = {
      .lflag = LFLAG_LAST,
      .tsdbRowKey = lastRowKey,
      .colVal = COL_VAL_VALUE(PRIMARYKEY_TIMESTAMP_COL_ID, ((SValue){.type = TSDB_DATA_TYPE_TIMESTAMP,
                                                                     .val = lastRow.pBlockData->aTSKEY[lastRow.iRow]}))};
  if (!taosArrayPush(pCtxs, &tsCtx)) {
    TAOS_CHECK_GOTO(terrno, &lino, _exit);
  }

  // data columns: walk backwards until a row with a value is found
  for (int32_t iColData = 0; iColData < pBlockData->nColData; ++iColData) {
    SColData *pColData = &pBlockData->aColData[iColData];
    if ((pColData->flag & HAS_VALUE) != HAS_VALUE) {
      continue;
    }

    scanRow.iRow = pBlockData->nRow - 1;
    while (scanRow.iRow >= 0) {
      STsdbRowKey scanKey = {0};
      tsdbRowGetKey(&scanRow, &scanKey);

      uint8_t bitValue = tColDataGetBitValue(pColData, scanRow.iRow);
      if (bitValue == 2) {
        SColVal colVal = COL_VAL_NONE(pColData->cid, pColData->type);
        TAOS_CHECK_GOTO(tColDataGetValue(pColData, scanRow.iRow, &colVal), &lino, _exit);

        SLastUpdateCtx lastCtx = {.lflag = LFLAG_LAST, .tsdbRowKey = scanKey, .colVal = colVal};
        if (!taosArrayPush(pCtxs, &lastCtx)) {
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
        }
        break;
      }

      --scanRow.iRow;
    }
  }

  // 2. "last row" updates
  TAOS_CHECK_GOTO(tsdbRowIterOpen(&rowIter, &lastRow, pSchema), &lino, _exit);

  SColVal *pColVal = tsdbRowIterNext(&rowIter);
  while (pColVal != NULL) {
    SLastUpdateCtx lastRowCtx = {.lflag = LFLAG_LAST_ROW, .tsdbRowKey = lastRowKey, .colVal = *pColVal};
    if (!taosArrayPush(pCtxs, &lastRowCtx)) {
      TAOS_CHECK_GOTO(terrno, &lino, _exit);
    }
    pColVal = tsdbRowIterNext(&rowIter);
  }

  TAOS_CHECK_GOTO(tsdbCacheUpdate(pTsdb, suid, uid, pCtxs), &lino, _exit);

_exit:
  tsdbRowClose(&rowIter);
  taosMemoryFreeClear(pSchema);
  taosArrayDestroy(pCtxs);

  TAOS_RETURN(code);
}
1747

1748
// Forward declaration. tsdbCacheLoadFromRaw() calls this for the keys that carry the LAST flag:
// aCols and slotIds are parallel arrays of nCols column ids and slot ids, and *ppLastArray
// receives the array of resulting SLastCol entries (the caller destroys that array).
// The definition is not visible in this part of the file.
static int32_t mergeLastCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr, int16_t *aCols,
1749
                            int nCols, int16_t *slotIds);
1750

1751
// Forward declaration. tsdbCacheLoadFromRaw() calls this for the keys that do NOT carry the LAST
// flag: aCols and slotIds are parallel arrays of nCols column ids and slot ids, and *ppLastArray
// receives the array of resulting SLastCol entries (the caller destroys that array).
// The definition is not visible in this part of the file.
static int32_t mergeLastRowCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr, int16_t *aCols,
1752
                               int nCols, int16_t *slotIds);
1753

1754
static int32_t tsdbCacheLoadFromRaw(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SArray *remainCols,
×
1755
                                    SCacheRowsReader *pr, int8_t ltype) {
1756
  int32_t               code = 0, lino = 0;
×
1757
  rocksdb_writebatch_t *wb = NULL;
×
1758
  SArray               *pTmpColArray = NULL;
×
1759
  bool                  extraTS = false;
×
1760

1761
  SIdxKey *idxKey = taosArrayGet(remainCols, 0);
×
1762
  if (idxKey->key.cid != PRIMARYKEY_TIMESTAMP_COL_ID) {
×
1763
    // ignore 'ts' loaded from cache and load it from tsdb
1764
    // SLastCol *pLastCol = taosArrayGet(pLastArray, 0);
1765
    // tsdbCacheUpdateLastColToNone(pLastCol, TSDB_LAST_CACHE_NO_CACHE);
1766

1767
    SLastKey *key = &(SLastKey){.lflag = ltype, .uid = uid, .cid = PRIMARYKEY_TIMESTAMP_COL_ID};
×
1768
    if (!taosArrayInsert(remainCols, 0, &(SIdxKey){0, *key})) {
×
1769
      TAOS_RETURN(terrno);
×
1770
    }
1771

1772
    extraTS = true;
×
1773
  }
1774

1775
  int      num_keys = TARRAY_SIZE(remainCols);
×
1776
  int16_t *slotIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1777

1778
  int16_t *lastColIds = NULL, *lastSlotIds = NULL, *lastrowColIds = NULL, *lastrowSlotIds = NULL;
×
1779
  lastColIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1780
  lastSlotIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1781
  lastrowColIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1782
  lastrowSlotIds = taosMemoryMalloc(num_keys * sizeof(int16_t));
×
1783
  SArray *lastTmpColArray = NULL, *lastTmpIndexArray = NULL, *lastrowTmpColArray = NULL, *lastrowTmpIndexArray = NULL;
×
1784

1785
  int lastIndex = 0;
×
1786
  int lastrowIndex = 0;
×
1787

1788
  if (!slotIds || !lastColIds || !lastSlotIds || !lastrowColIds || !lastrowSlotIds) {
×
1789
    TAOS_CHECK_EXIT(terrno);
×
1790
  }
1791

1792
  for (int i = 0; i < num_keys; ++i) {
×
1793
    SIdxKey *idxKey = taosArrayGet(remainCols, i);
×
1794
    if (extraTS && !i) {
×
1795
      slotIds[i] = 0;
×
1796
    } else {
1797
      slotIds[i] = pr->pSlotIds[idxKey->idx];
×
1798
    }
1799

1800
    if (IS_LAST_KEY(idxKey->key)) {
×
1801
      if (NULL == lastTmpIndexArray) {
×
1802
        lastTmpIndexArray = taosArrayInit(num_keys, sizeof(int32_t));
×
1803
        if (!lastTmpIndexArray) {
×
1804
          TAOS_CHECK_EXIT(terrno);
×
1805
        }
1806
      }
1807
      if (!taosArrayPush(lastTmpIndexArray, &(i))) {
×
1808
        TAOS_CHECK_EXIT(terrno);
×
1809
      }
1810
      lastColIds[lastIndex] = idxKey->key.cid;
×
1811
      if (extraTS && !i) {
×
1812
        lastSlotIds[lastIndex] = 0;
×
1813
      } else {
1814
        lastSlotIds[lastIndex] = pr->pSlotIds[idxKey->idx];
×
1815
      }
1816
      lastIndex++;
×
1817
    } else {
1818
      if (NULL == lastrowTmpIndexArray) {
×
1819
        lastrowTmpIndexArray = taosArrayInit(num_keys, sizeof(int32_t));
×
1820
        if (!lastrowTmpIndexArray) {
×
1821
          TAOS_CHECK_EXIT(terrno);
×
1822
        }
1823
      }
1824
      if (!taosArrayPush(lastrowTmpIndexArray, &(i))) {
×
1825
        TAOS_CHECK_EXIT(terrno);
×
1826
      }
1827
      lastrowColIds[lastrowIndex] = idxKey->key.cid;
×
1828
      if (extraTS && !i) {
×
1829
        lastrowSlotIds[lastrowIndex] = 0;
×
1830
      } else {
1831
        lastrowSlotIds[lastrowIndex] = pr->pSlotIds[idxKey->idx];
×
1832
      }
1833
      lastrowIndex++;
×
1834
    }
1835
  }
1836

1837
  pTmpColArray = taosArrayInit(lastIndex + lastrowIndex, sizeof(SLastCol));
×
1838
  if (!pTmpColArray) {
×
1839
    TAOS_CHECK_EXIT(terrno);
×
1840
  }
1841

1842
  if (lastTmpIndexArray != NULL) {
×
1843
    TAOS_CHECK_EXIT(mergeLastCid(uid, pTsdb, &lastTmpColArray, pr, lastColIds, lastIndex, lastSlotIds));
×
1844
    for (int i = 0; i < taosArrayGetSize(lastTmpColArray); i++) {
×
1845
      if (!taosArrayInsert(pTmpColArray, *(int32_t *)taosArrayGet(lastTmpIndexArray, i),
×
1846
                           taosArrayGet(lastTmpColArray, i))) {
×
1847
        TAOS_CHECK_EXIT(terrno);
×
1848
      }
1849
    }
1850
  }
1851

1852
  if (lastrowTmpIndexArray != NULL) {
×
1853
    TAOS_CHECK_EXIT(mergeLastRowCid(uid, pTsdb, &lastrowTmpColArray, pr, lastrowColIds, lastrowIndex, lastrowSlotIds));
×
1854
    for (int i = 0; i < taosArrayGetSize(lastrowTmpColArray); i++) {
×
1855
      if (!taosArrayInsert(pTmpColArray, *(int32_t *)taosArrayGet(lastrowTmpIndexArray, i),
×
1856
                           taosArrayGet(lastrowTmpColArray, i))) {
×
1857
        TAOS_CHECK_EXIT(terrno);
×
1858
      }
1859
    }
1860
  }
1861

1862
  SLRUCache *pCache = pTsdb->lruCache;
×
1863
  for (int i = 0; i < num_keys; ++i) {
×
1864
    SIdxKey  *idxKey = taosArrayGet(remainCols, i);
×
1865
    SLastCol *pLastCol = NULL;
×
1866

1867
    if (pTmpColArray && TARRAY_SIZE(pTmpColArray) >= i + 1) {
×
1868
      pLastCol = taosArrayGet(pTmpColArray, i);
×
1869
    }
1870

1871
    // still null, then make up a none col value
1872
    SLastCol noneCol = {.rowKey.ts = TSKEY_MIN,
×
1873
                        .colVal = COL_VAL_NONE(idxKey->key.cid, pr->pSchema->columns[slotIds[i]].type),
×
1874
                        .cacheStatus = TSDB_LAST_CACHE_VALID};
1875
    if (!pLastCol) {
×
1876
      pLastCol = &noneCol;
×
1877
    }
1878

1879
    if (!extraTS || i > 0) {
×
1880
      taosArraySet(pLastArray, idxKey->idx, pLastCol);
×
1881
    }
1882
    // taosArrayRemove(remainCols, i);
1883

1884
    if (/*!pTmpColArray*/ lastTmpIndexArray && !lastTmpColArray) {
×
1885
      continue;
×
1886
    }
1887
    if (/*!pTmpColArray*/ lastrowTmpIndexArray && !lastrowTmpColArray) {
×
1888
      continue;
×
1889
    }
1890

1891
    // store result back to rocks cache
1892
    code = tsdbCachePutToRocksdb(pTsdb, &idxKey->key, pLastCol);
×
1893
    if (code) {
×
1894
      tsdbError("vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
×
1895
      TAOS_CHECK_EXIT(code);
×
1896
    }
1897

1898
    code = tsdbCachePutToLRU(pTsdb, &idxKey->key, pLastCol, 0);
×
1899
    if (code) {
×
1900
      tsdbError("vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
×
1901
      TAOS_CHECK_EXIT(code);
×
1902
    }
1903
  }
1904

1905
  rocksMayWrite(pTsdb, false);
×
1906

1907
_exit:
×
1908
  taosArrayDestroy(lastrowTmpIndexArray);
×
1909
  taosArrayDestroy(lastrowTmpColArray);
×
1910
  taosArrayDestroy(lastTmpIndexArray);
×
1911
  taosArrayDestroy(lastTmpColArray);
×
1912

1913
  taosMemoryFree(lastColIds);
×
1914
  taosMemoryFree(lastSlotIds);
×
1915
  taosMemoryFree(lastrowColIds);
×
1916
  taosMemoryFree(lastrowSlotIds);
×
1917

1918
  taosArrayDestroy(pTmpColArray);
×
1919

1920
  taosMemoryFree(slotIds);
×
1921

1922
  TAOS_RETURN(code);
×
1923
}
1924

1925
/*
 * Try to resolve the columns in remainCols from the rocksdb cache.
 *
 * For every key whose rocksdb value deserializes to an entry that is not marked
 * TSDB_LAST_CACHE_NO_CACHE, the entry is put into the LRU cache, a copy is
 * stored into pLastArray at the key's original index, and the key is removed
 * from remainCols / ignoreFromRocks. Keys flagged in ignoreFromRocks are left
 * in remainCols untouched. Whatever is still in remainCols afterwards is handed
 * to tsdbCacheLoadFromRaw().
 *
 * pTsdb            tsdb instance owning the caches
 * uid              table uid
 * pLastArray       result array, updated in place
 * remainCols       array of SIdxKey still to be resolved (modified)
 * ignoreFromRocks  array of bool kept parallel to remainCols (modified)
 * pr, ltype        forwarded to tsdbCacheLoadFromRaw()
 *
 * Returns 0 on success, otherwise an error code.
 */
static int32_t tsdbCacheLoadFromRocks(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SArray *remainCols,
                                      SArray *ignoreFromRocks, SCacheRowsReader *pr, int8_t ltype) {
  int32_t code = 0, lino = 0;
  int     num_keys = TARRAY_SIZE(remainCols);
  char  **keys_list = taosMemoryMalloc(num_keys * sizeof(char *));
  size_t *keys_list_sizes = taosMemoryMalloc(num_keys * sizeof(size_t));
  char   *key_list = taosMemoryMalloc(num_keys * ROCKS_KEY_LEN);
  if (!keys_list || !keys_list_sizes || !key_list) {
    // capture the error first, then release whichever of the three buffers was allocated
    code = terrno;
    taosMemoryFree(key_list);
    taosMemoryFree(keys_list);
    taosMemoryFree(keys_list_sizes);
    TAOS_RETURN(code);
  }
  char  **values_list = NULL;
  size_t *values_list_sizes = NULL;

  // keys are stored back to back in key_list; keys_list[i] points at the i-th one
  for (int i = 0; i < num_keys; ++i) {
    memcpy(key_list + i * ROCKS_KEY_LEN, &((SIdxKey *)taosArrayGet(remainCols, i))->key, ROCKS_KEY_LEN);
    keys_list[i] = key_list + i * ROCKS_KEY_LEN;
    keys_list_sizes[i] = ROCKS_KEY_LEN;
  }

  rocksMayWrite(pTsdb, true);  // flush writebatch cache

  code = tsdbCacheGetValuesFromRocks(pTsdb, num_keys, (const char *const *)keys_list, keys_list_sizes, &values_list,
                                     &values_list_sizes);
  if (code) {
    taosMemoryFree(key_list);
    taosMemoryFree(keys_list);
    taosMemoryFree(keys_list_sizes);
    TAOS_RETURN(code);
  }

  // i walks the fetched values (original key order); j walks the current,
  // possibly shrunken, remainCols / ignoreFromRocks arrays.
  for (int i = 0, j = 0; i < num_keys && j < TARRAY_SIZE(remainCols); ++i) {
    SLastCol *pLastCol = NULL;
    // ignoreFromRocks shrinks together with remainCols, so it must be indexed by j, not i
    bool      ignore = ((bool *)TARRAY_DATA(ignoreFromRocks))[j];
    if (ignore) {
      ++j;
      continue;
    }

    if (values_list[i] != NULL) {
      code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
        goto _exit;
      }
    }
    SLastCol *pToFree = pLastCol;
    SIdxKey  *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[j];
    if (pLastCol && pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
      code = tsdbCachePutToLRU(pTsdb, &idxKey->key, pLastCol, 0);
      if (code) {
        tsdbError("vgId:%d, %s failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__, tstrerror(code));
        taosMemoryFreeClear(pToFree);
        TAOS_CHECK_EXIT(code);
      }

      // hand a separately reallocated copy to the caller; the deserialized entry is freed below
      SLastCol lastCol = *pLastCol;
      code = tsdbCacheReallocSLastCol(&lastCol, NULL);
      if (TSDB_CODE_SUCCESS != code) {
        taosMemoryFreeClear(pToFree);
        TAOS_CHECK_EXIT(code);
      }

      taosArraySet(pLastArray, idxKey->idx, &lastCol);
      // resolved: drop the key; j now refers to the next unresolved key
      taosArrayRemove(remainCols, j);
      taosArrayRemove(ignoreFromRocks, j);
    } else {
      ++j;
    }

    taosMemoryFreeClear(pToFree);
  }

  if (TARRAY_SIZE(remainCols) > 0) {
    // tsdbTrace("tsdb/cache: vgId: %d, load %" PRId64 " from raw", TD_VID(pTsdb->pVnode), uid);
    code = tsdbCacheLoadFromRaw(pTsdb, uid, pLastArray, remainCols, pr, ltype);
  }

_exit:
  taosMemoryFree(key_list);
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  if (values_list) {
    // each value buffer is released with rocksdb_free(), the array itself with taosMemoryFree()
    for (int i = 0; i < num_keys; ++i) {
      rocksdb_free(values_list[i]);
    }
    taosMemoryFree(values_list);
  }
  taosMemoryFree(values_list_sizes);

  TAOS_RETURN(code);
}
2019

2020
/*
 * Resolve every column id in pr->pCidList for table uid, trying the LRU cache
 * first and falling back to tsdbCacheLoadFromRocks() for the misses.
 *
 * For each column one SLastKey is appended to keyArray and one SLastCol to
 * pLastArray (a copy of the cached entry, or a NONE placeholder on a miss).
 * Misses are collected in a local remainCols array; under pTsdb->lruMutex the
 * LRU cache is checked once more for them, and whatever is still missing is
 * passed to tsdbCacheLoadFromRocks(), which overwrites the placeholders.
 *
 * pTsdb       tsdb instance owning the caches
 * uid         table uid
 * pLastArray  output array of SLastCol, one entry per column
 * pr          reader supplying pCidList, pFuncTypeList, type, pSchema, pSlotIds
 * ltype       default flag value for the generated keys
 * keyArray    output array of SLastKey, one entry per column
 *
 * Returns 0 on success, otherwise an error code.
 */
static int32_t tsdbCacheGetBatchFromLru(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SCacheRowsReader *pr,
                                        int8_t ltype, SArray *keyArray) {
  int32_t    code = 0, lino = 0;
  SArray    *remainCols = NULL;
  SArray    *ignoreFromRocks = NULL;
  SLRUCache *pCache = pTsdb->lruCache;
  SArray    *pCidList = pr->pCidList;
  int        numKeys = TARRAY_SIZE(pCidList);

  for (int i = 0; i < numKeys; ++i) {
    int16_t cid = ((int16_t *)TARRAY_DATA(pCidList))[i];

    SLastKey key = {.lflag = ltype, .uid = uid, .cid = cid};
    // for select last_row, last case
    int32_t funcType = FUNCTION_TYPE_CACHE_LAST;
    if (pr->pFuncTypeList != NULL && taosArrayGetSize(pr->pFuncTypeList) > i) {
      funcType = ((int32_t *)TARRAY_DATA(pr->pFuncTypeList))[i];
    }
    if (((pr->type & CACHESCAN_RETRIEVE_LAST) == CACHESCAN_RETRIEVE_LAST) && FUNCTION_TYPE_CACHE_LAST_ROW == funcType) {
      // a last_row column inside a LAST scan: recompute the key flag with the LAST_ROW bit swapped in
      int8_t tempType = CACHESCAN_RETRIEVE_LAST_ROW | (pr->type ^ CACHESCAN_RETRIEVE_LAST);
      key.lflag = (tempType & CACHESCAN_RETRIEVE_LAST) >> 3;
    }

    if (!taosArrayPush(keyArray, &key)) {
      TAOS_CHECK_EXIT(terrno);
    }

    LRUHandle *h = taosLRUCacheLookup(pCache, &key, ROCKS_KEY_LEN);
    SLastCol  *pLastCol = h ? (SLastCol *)taosLRUCacheValue(pCache, h) : NULL;
    if (h && pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
      // cache hit: give the caller its own reallocated copy of the entry
      SLastCol lastCol = *pLastCol;
      if (TSDB_CODE_SUCCESS != (code = tsdbCacheReallocSLastCol(&lastCol, NULL))) {
        tsdbLRUCacheRelease(pCache, h, false);
        TAOS_CHECK_GOTO(code, NULL, _exit);
      }

      if (taosArrayPush(pLastArray, &lastCol) == NULL) {
        code = terrno;
        tsdbLRUCacheRelease(pCache, h, false);
        goto _exit;
      }
    } else {
      // no cache or cache is invalid; h may be NULL here, so every release below is guarded
      SLastCol noneCol = {.rowKey.ts = TSKEY_MIN,
                          .colVal = COL_VAL_NONE(cid, pr->pSchema->columns[pr->pSlotIds[i]].type)};

      if (taosArrayPush(pLastArray, &noneCol) == NULL) {
        code = terrno;
        if (h) {
          tsdbLRUCacheRelease(pCache, h, false);
        }
        goto _exit;
      }

      if (!remainCols) {
        if ((remainCols = taosArrayInit(numKeys, sizeof(SIdxKey))) == NULL) {
          code = terrno;
          if (h) {
            tsdbLRUCacheRelease(pCache, h, false);
          }
          goto _exit;
        }
      }
      if (!ignoreFromRocks) {
        if ((ignoreFromRocks = taosArrayInit(numKeys, sizeof(bool))) == NULL) {
          code = terrno;
          if (h) {
            tsdbLRUCacheRelease(pCache, h, false);
          }
          goto _exit;
        }
      }
      if (taosArrayPush(remainCols, &(SIdxKey){i, key}) == NULL) {
        code = terrno;
        if (h) {
          tsdbLRUCacheRelease(pCache, h, false);
        }
        goto _exit;
      }
      // an LRU entry explicitly marked NO_CACHE means rocksdb must not be consulted for this key
      bool ignoreRocks = pLastCol ? (pLastCol->cacheStatus == TSDB_LAST_CACHE_NO_CACHE) : false;
      if (taosArrayPush(ignoreFromRocks, &ignoreRocks) == NULL) {
        code = terrno;
        if (h) {
          tsdbLRUCacheRelease(pCache, h, false);
        }
        goto _exit;
      }
    }

    if (h) {
      tsdbLRUCacheRelease(pCache, h, false);
    }
  }

  if (remainCols && TARRAY_SIZE(remainCols) > 0) {
    (void)taosThreadMutexLock(&pTsdb->lruMutex);

    // second LRU pass with the mutex held, before going to rocksdb
    for (int i = 0; i < TARRAY_SIZE(remainCols);) {
      SIdxKey   *idxKey = &((SIdxKey *)TARRAY_DATA(remainCols))[i];
      LRUHandle *h = taosLRUCacheLookup(pCache, &idxKey->key, ROCKS_KEY_LEN);
      SLastCol  *pLastCol = h ? (SLastCol *)taosLRUCacheValue(pCache, h) : NULL;
      if (h && pLastCol->cacheStatus != TSDB_LAST_CACHE_NO_CACHE) {
        SLastCol lastCol = *pLastCol;
        code = tsdbCacheReallocSLastCol(&lastCol, NULL);
        if (code) {
          tsdbLRUCacheRelease(pCache, h, false);
          (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
          // leave through _exit so remainCols / ignoreFromRocks are destroyed
          goto _exit;
        }

        taosArraySet(pLastArray, idxKey->idx, &lastCol);

        // resolved: remove from both parallel arrays; i now refers to the next entry
        taosArrayRemove(remainCols, i);
        taosArrayRemove(ignoreFromRocks, i);
      } else {
        // no cache or cache is invalid
        ++i;
      }
      if (h) {
        tsdbLRUCacheRelease(pCache, h, false);
      }
    }

    // tsdbTrace("tsdb/cache: vgId: %d, load %" PRId64 " from rocks", TD_VID(pTsdb->pVnode), uid);
    code = tsdbCacheLoadFromRocks(pTsdb, uid, pLastArray, remainCols, ignoreFromRocks, pr, ltype);

    (void)taosThreadMutexUnlock(&pTsdb->lruMutex);
  }

_exit:
  if (remainCols) {
    taosArrayDestroy(remainCols);
  }
  if (ignoreFromRocks) {
    taosArrayDestroy(ignoreFromRocks);
  }

  TAOS_RETURN(code);
}
2149

2150
// State of the small state machine driven by getNextRowFromMem().
typedef enum SMEMNEXTROWSTATES {
2151
  // initial state: the next call opens the table-data iterator and returns its first row
  SMEMNEXTROW_ENTER,
2152
  // the iterator is open: each call advances it and returns the row it then points to
  SMEMNEXTROW_NEXT,
2153
} SMEMNEXTROWSTATES;
2154

2155
// Per-source iteration state consumed by getNextRowFromMem().
typedef struct SMemNextRowIter {
2156
  // current state of the state machine (see SMEMNEXTROWSTATES)
  SMEMNEXTROWSTATES state;
2157
  STbData          *pMem;  // [input] table data to iterate; NULL yields no rows
2158
  STbDataIter       iter;  // mem buffer skip list iterator, opened by getNextRowFromMem() in the ENTER state
2159
  // only referenced by a commented-out check in getNextRowFromMem(); not read by the code visible here
  int64_t           lastTs;
2160
} SMemNextRowIter;
2161

2162
/*
 * _next_row_fn_t implementation for an in-memory table (SMemNextRowIter).
 *
 * The first call (state SMEMNEXTROW_ENTER) opens the table-data iterator and
 * returns the row it points to; subsequent calls (state SMEMNEXTROW_NEXT)
 * advance the iterator and return the new row. *ppRow is set to NULL when
 * there is no table data or no further row.
 *
 * iter              pointer to an SMemNextRowIter
 * ppRow             receives the next row, or NULL
 * pIgnoreEarlierTs  always set to false
 * isLast, aCols, nCols  unused here; present to match _next_row_fn_t
 *
 * Always returns 0.
 */
static int32_t getNextRowFromMem(void *iter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast, int16_t *aCols,
                                 int nCols) {
  SMemNextRowIter *pMemIter = (SMemNextRowIter *)iter;
  TSDBROW         *pNextRow = NULL;
  int32_t          code = 0;

  *pIgnoreEarlierTs = false;

  if (pMemIter->state == SMEMNEXTROW_ENTER) {
    // A former early-out comparing pMem->maxKey with lastTs is disabled (it was commented out).
    if (pMemIter->pMem != NULL) {
      tsdbTbDataIterOpen(pMemIter->pMem, NULL, 1, &pMemIter->iter);

      pNextRow = tsdbTbDataIterGet(&pMemIter->iter);
      if (pNextRow != NULL) {
        // only switch state once a first row has actually been produced
        pMemIter->state = SMEMNEXTROW_NEXT;
      }
    }
  } else if (pMemIter->state == SMEMNEXTROW_NEXT) {
    if (tsdbTbDataIterNext(&pMemIter->iter)) {
      pNextRow = tsdbTbDataIterGet(&pMemIter->iter);
    }
  }

  // any other state value falls through with pNextRow == NULL
  *ppRow = pNextRow;

  TAOS_RETURN(code);
}
2212

2213
// Callback that produces the next row of one input source. It stores the row (or NULL when the
// source is exhausted) in *ppRow, writes *pIgnoreEarlierTs, and returns 0 or an error code.
typedef int32_t (*_next_row_fn_t)(void *iter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast, int16_t *aCols,
2214
                                  int nCols);
2215
// Optional callback invoked with the source's iter by memRowIterClose() when it is non-NULL.
typedef int32_t (*_next_row_clear_fn_t)(void *iter);
2216

2217
// One input source of a merged row iteration (see memRowIterGet()).
typedef struct {
2218
  TSDBROW             *pRow;  // row most recently produced by nextRowFn; NULL once exhausted
2219
  bool                 stop;  // true when this source has no more rows (or was never opened)
2220
  bool                 next;  // true when nextRowFn must be called before pRow is examined again
2221
  bool                 ignoreEarlierTs;  // written by nextRowFn through its pIgnoreEarlierTs argument
2222
  void                *iter;  // opaque state passed to nextRowFn and nextRowClearFn
2223
  _next_row_fn_t       nextRowFn;  // produces the next row of this source
2224
  _next_row_clear_fn_t nextRowClearFn;  // optional cleanup hook; may be NULL
2225
} TsdbNextRowState;
2226

2227
// Iterator over the rows of one table taken from the mem and imem tables of a read snapshot,
// filtered by delete data. Set up by memRowIterOpen(), released by memRowIterClose().
typedef struct {
2228
  SArray           *pMemDelData;  // filled by loadMemTombData() in memRowIterOpen()
2229
  SArray           *pSkyline;  // array of TSDBKEY, built on first use in memRowIterGet()
2230
  int64_t           iSkyline;  // cursor into pSkyline; starts at the last element
2231
  SBlockIdx         idx;  // suid / uid of the table being iterated
2232
  SMemNextRowIter   memState;  // iteration state for the mem table (input[0])
2233
  SMemNextRowIter   imemState;  // iteration state for the imem table (input[1])
2234
  TSDBROW           memRow, imemRow;  // initial targets of input[0].pRow / input[1].pRow
2235
  TsdbNextRowState  input[2];  // [0] = mem source, [1] = imem source
2236
  SCacheRowsReader *pr;  // reader passed to getTableLoadInfo()
2237
  STsdb            *pTsdb;  // tsdb instance given to memRowIterOpen()
2238
} MemNextRowIter;
2239

2240
static int32_t memRowIterOpen(MemNextRowIter *pIter, tb_uid_t uid, STsdb *pTsdb, STSchema *pTSchema, tb_uid_t suid,
×
2241
                              STsdbReadSnap *pReadSnap, SCacheRowsReader *pr) {
2242
  int32_t code = 0, lino = 0;
×
2243

2244
  STbData *pMem = NULL;
×
2245
  if (pReadSnap->pMem) {
×
2246
    pMem = tsdbGetTbDataFromMemTable(pReadSnap->pMem, suid, uid);
×
2247
  }
2248

2249
  STbData *pIMem = NULL;
×
2250
  if (pReadSnap->pIMem) {
×
2251
    pIMem = tsdbGetTbDataFromMemTable(pReadSnap->pIMem, suid, uid);
×
2252
  }
2253

2254
  pIter->pTsdb = pTsdb;
×
2255

2256
  pIter->pMemDelData = NULL;
×
2257

2258
  TAOS_CHECK_GOTO(loadMemTombData(&pIter->pMemDelData, pMem, pIMem, pr->info.verRange.maxVer), &lino, _exit);
×
2259

2260
  pIter->idx = (SBlockIdx){.suid = suid, .uid = uid};
×
2261

2262
  pIter->input[0] = (TsdbNextRowState){&pIter->memRow, true, false, false, &pIter->memState, getNextRowFromMem, NULL};
×
2263
  pIter->input[1] = (TsdbNextRowState){&pIter->imemRow, true, false, false, &pIter->imemState, getNextRowFromMem, NULL};
×
2264

2265
  if (pMem) {
×
2266
    pIter->memState.pMem = pMem;
×
2267
    pIter->memState.state = SMEMNEXTROW_ENTER;
×
2268
    pIter->input[0].stop = false;
×
2269
    pIter->input[0].next = true;
×
2270
  }
2271

2272
  if (pIMem) {
×
2273
    pIter->imemState.pMem = pIMem;
×
2274
    pIter->imemState.state = SMEMNEXTROW_ENTER;
×
2275
    pIter->input[1].stop = false;
×
2276
    pIter->input[1].next = true;
×
2277
  }
2278

2279
  pIter->pr = pr;
×
2280

2281
_exit:
×
2282
  if (code) {
×
2283
    tsdbError("tsdb/cache: %s failed at line %d since %s.", __func__, lino, tstrerror(code));
×
2284
  }
2285

2286
  TAOS_RETURN(code);
×
2287
}
2288

2289
/*
 * Release what a MemNextRowIter holds: run each input's optional clear
 * callback, then destroy the skyline and delete-data arrays if present.
 */
static void memRowIterClose(MemNextRowIter *pIter) {
  for (int i = 0; i < 2; ++i) {
    TsdbNextRowState *pInput = &pIter->input[i];
    if (pInput->nextRowClearFn != NULL) {
      (void)pInput->nextRowClearFn(pInput->iter);
    }
  }

  if (pIter->pSkyline != NULL) {
    taosArrayDestroy(pIter->pSkyline);
  }

  if (pIter->pMemDelData != NULL) {
    taosArrayDestroy(pIter->pMemDelData);
  }
}
×
2304

2305
/*
 * Free callback installed on the table map by getTableLoadInfo(): param points
 * at a stored pointer, which is freed and reset to NULL.
 */
static void freeTableInfoFunc(void *param) {
  void **ppStored = (void **)param;

  taosMemoryFreeClear(*ppStored);
}
×
2309

2310
/*
 * Return the STableLoadInfo registered for uid in pReader->pTableMap, creating
 * the map and/or a zero-initialised entry on first use.
 *
 * The map stores pointers to heap-allocated STableLoadInfo objects and has
 * freeTableInfoFunc installed as its free callback.
 *
 * Returns NULL when the map or the entry cannot be allocated, or when the new
 * entry cannot be inserted into the map.
 */
static STableLoadInfo *getTableLoadInfo(SCacheRowsReader *pReader, uint64_t uid) {
  if (!pReader->pTableMap) {
    pReader->pTableMap = tSimpleHashInit(pReader->numOfTables, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT));
    if (!pReader->pTableMap) {
      return NULL;
    }

    tSimpleHashSetFreeFp(pReader->pTableMap, freeTableInfoFunc);
  }

  STableLoadInfo **ppInfo = tSimpleHashGet(pReader->pTableMap, &uid, sizeof(uid));
  if (ppInfo) {
    return *ppInfo;
  }

  STableLoadInfo *pInfo = taosMemoryCalloc(1, sizeof(STableLoadInfo));
  if (!pInfo) {
    return NULL;
  }

  if (tSimpleHashPut(pReader->pTableMap, &uid, sizeof(uid), &pInfo, POINTER_BYTES)) {
    // the map did not take the entry, so nothing else refers to it: free it here
    taosMemoryFree(pInfo);
    return NULL;
  }

  return pInfo;
}
2335

2336
/*
 * Return the next row from the mem / imem inputs of pIter that has the largest
 * row key and is not covered by delete data, or NULL when both inputs are
 * exhausted.
 *
 * Each round: (1) inputs flagged `next` are advanced; (2) the row(s) with the
 * largest key among the live inputs are selected; (3) rows reported deleted by
 * tsdbKeyDeleted() are discarded and their inputs flagged for advancing. The
 * delete skyline is built on first use from the table's tomb data plus
 * pIter->pMemDelData. When both inputs hold the same key, the row from the
 * lower-numbered input is returned.
 *
 * isLast, aCols and nCols are forwarded to the inputs' nextRowFn.
 *
 * NULL is also returned on an internal error, after logging it; the caller
 * cannot distinguish that from exhaustion.
 */
static TSDBROW *memRowIterGet(MemNextRowIter *pIter, bool isLast, int16_t *aCols, int nCols) {
  int32_t code = 0, lino = 0;

  while (1) {
    // 1. advance every input that asked for it
    for (int i = 0; i < 2; ++i) {
      TsdbNextRowState *pInput = &pIter->input[i];
      if (!pInput->next || pInput->stop) {
        continue;
      }

      TAOS_CHECK_GOTO(
          pInput->nextRowFn(pInput->iter, &pInput->pRow, &pInput->ignoreEarlierTs, isLast, aCols, nCols), &lino,
          _exit);

      if (pInput->pRow == NULL) {
        pInput->stop = true;
        pInput->next = false;
      }
    }

    if (pIter->input[0].stop && pIter->input[1].stop) {
      return NULL;
    }

    // 2. pick the row(s) carrying the largest key
    TSDBROW *topRows[2] = {0};
    int      topIdx[2] = {-1, -1};
    int      nTop = 0;
    SRowKey  topKey = {.ts = TSKEY_MIN};

    for (int i = 0; i < 2; ++i) {
      TsdbNextRowState *pInput = &pIter->input[i];
      if (pInput->stop || pInput->pRow == NULL) {
        continue;
      }

      STsdbRowKey rowKey = {0};
      tsdbRowGetKey(pInput->pRow, &rowKey);

      // merging & deduplicating on client side
      int cmp = tRowKeyCompare(&topKey, &rowKey.key);
      if (cmp < 0) {
        // strictly larger key: restart the candidate list
        nTop = 0;
        topKey = rowKey.key;
      }
      if (cmp <= 0) {
        topIdx[nTop] = i;
        topRows[nTop++] = pInput->pRow;
      }

      pInput->next = false;
    }

    // 3. drop candidates that are covered by delete data
    TSDBROW *liveRows[2] = {0};
    int      liveIdx[2] = {-1, -1};
    int      nLive = 0;

    for (int i = 0; i < nTop; ++i) {
      TSDBKEY candKey = TSDBROW_KEY(topRows[i]);

      if (pIter->pSkyline == NULL) {
        // first use: build the delete skyline for this table
        pIter->pSkyline = taosArrayInit(32, sizeof(TSDBKEY));
        TSDB_CHECK_NULL(pIter->pSkyline, code, lino, _exit, terrno);

        STableLoadInfo *pLoadInfo = getTableLoadInfo(pIter->pr, pIter->idx.uid);
        TSDB_CHECK_NULL(pLoadInfo, code, lino, _exit, TSDB_CODE_OUT_OF_MEMORY);

        if (pLoadInfo->pTombData == NULL) {
          pLoadInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
          TSDB_CHECK_NULL(pLoadInfo->pTombData, code, lino, _exit, terrno);
        }

        if (!taosArrayAddAll(pLoadInfo->pTombData, pIter->pMemDelData)) {
          TAOS_CHECK_GOTO(terrno, &lino, _exit);
        }

        size_t nTomb = TARRAY_SIZE(pLoadInfo->pTombData);
        if (nTomb > 0) {
          code = tsdbBuildDeleteSkyline(pLoadInfo->pTombData, 0, (int32_t)(nTomb - 1), pIter->pSkyline);
          TAOS_CHECK_GOTO(code, &lino, _exit);
        }
        pIter->iSkyline = taosArrayGetSize(pIter->pSkyline) - 1;
      }

      bool isDeleted = tsdbKeyDeleted(&candKey, pIter->pSkyline, &pIter->iSkyline);
      if (!isDeleted) {
        liveIdx[nLive] = topIdx[i];
        liveRows[nLive++] = topRows[i];
      }

      // a deleted row is skipped by advancing its input in the next round
      pIter->input[topIdx[i]].next = isDeleted;
    }

    if (nLive > 0) {
      // the returned row is consumed: its input advances on the next call
      pIter->input[liveIdx[0]].next = true;

      return liveRows[0];
    }
  }

_exit:
  if (code) {
    tsdbError("tsdb/cache: %s failed at line %d since %s.", __func__, lino, tstrerror(code));
  }

  return NULL;
}
2436

2437
/*
 * Allocate a byte-for-byte copy of pSrc (header plus numOfCols column entries)
 * and store it in *ppDst.
 *
 * Returns TSDB_CODE_SUCCESS, or terrno when the allocation fails (in which
 * case *ppDst is NULL).
 */
static int32_t cloneTSchema(STSchema *pSrc, STSchema **ppDst) {
  int32_t nBytes = sizeof(STSchema) + sizeof(STColumn) * pSrc->numOfCols;

  STSchema *pCopy = taosMemoryMalloc(nBytes);
  *ppDst = pCopy;
  if (pCopy == NULL) {
    TAOS_RETURN(terrno);
  }

  memcpy(pCopy, pSrc, nBytes);

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
2447

2448
/*
 * Make pReader->pCurrSchema hold the schema with version sversion.
 *
 * - No current schema and sversion equals pReader->pSchema->version: clone pSchema.
 * - Current schema already has version sversion: nothing to do.
 * - Otherwise: free the current schema and fetch the requested version for
 *   (pReader->info.suid, uid) through metaGetTbTSchemaEx().
 *
 * Returns 0 on success, otherwise the error code of the clone or fetch.
 */
static int32_t updateTSchema(int32_t sversion, SCacheRowsReader *pReader, uint64_t uid) {
  if (pReader->pCurrSchema == NULL) {
    if (sversion == pReader->pSchema->version) {
      TAOS_RETURN(cloneTSchema(pReader->pSchema, &pReader->pCurrSchema));
    }
  } else if (sversion == pReader->pCurrSchema->version) {
    TAOS_RETURN(TSDB_CODE_SUCCESS);
  }

  // version mismatch: discard whatever is cached and load the requested version
  taosMemoryFreeClear(pReader->pCurrSchema);

  SMeta *pMeta = pReader->pTsdb->pVnode->pMeta;
  TAOS_RETURN(metaGetTbTSchemaEx(pMeta, pReader->info.suid, uid, sversion, &pReader->pCurrSchema));
}
2461

2462
/*
 * Overlay the entries of pLastArray with data taken from the in-memory rows of
 * table `uid`.
 *
 * pLastArray holds SLastCol items and keyArray holds the matching SLastKey
 * items at the same index. The first row returned by the memory iterator is
 * walked together with pLastArray in ascending column-id order:
 *
 *  - entry whose key is not a "last" key (IS_LAST_KEY is false): replaced when
 *    the cached row key compares lower than the row's key, or compares equal
 *    and the row's column is not NONE;
 *  - entry whose key is a "last" key: replaced when the row's column carries a
 *    value and the cached row key compares lower or equal; when the row's
 *    column carries no value, the column is remembered in iColHash
 *    (cid -> index in pLastArray).
 *
 * If any column was remembered, following rows from the iterator are scanned
 * until every remembered column has been seen with a value (or rows run out).
 *
 * Returns 0 on success or the first error code reported by a callee.
 */
static int32_t tsdbCacheGetBatchFromMem(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SCacheRowsReader *pr,
                                        SArray *keyArray) {
  int32_t        code = 0;
  int32_t        lino = 0;
  STSchema      *pTSchema = pr->pSchema;
  MemNextRowIter iter = {0};
  SSHashObj     *iColHash = NULL;
  STSDBRowIter   rowIter = {0};

  // 1, get from mem, imem filtered with delete info
  TAOS_CHECK_EXIT(memRowIterOpen(&iter, uid, pTsdb, pTSchema, pr->info.suid, pr->pReadSnap, pr));

  TSDBROW *pRow = memRowIterGet(&iter, false, NULL, 0);
  if (!pRow) {
    goto _exit;
  }

  // a row that reports schema version -1 is decoded with the reader's base schema
  int32_t sversion = TSDBROW_SVERSION(pRow);
  if (sversion != -1) {
    TAOS_CHECK_EXIT(updateTSchema(sversion, pr, uid));

    pTSchema = pr->pCurrSchema;
  }
  int32_t nCol = pTSchema->numOfCols;

  STsdbRowKey rowKey = {0};
  tsdbRowGetKey(pRow, &rowKey);

  TAOS_CHECK_EXIT(tsdbRowIterOpen(&rowIter, pRow, pTSchema));

  // iCol counts row columns consumed, jCol indexes pLastArray / keyArray
  int32_t iCol = 0, jCol = 0, jnCol = TARRAY_SIZE(pLastArray);
  for (SColVal *pColVal = tsdbRowIterNext(&rowIter); pColVal && iCol < nCol && jCol < jnCol;) {
    SLastCol *pTargetCol = &((SLastCol *)TARRAY_DATA(pLastArray))[jCol];
    if (pColVal->cid < pTargetCol->colVal.cid) {
      // row column is not requested, skip it
      pColVal = tsdbRowIterNext(&rowIter), ++iCol;

      continue;
    }
    if (pColVal->cid > pTargetCol->colVal.cid) {
      break;
    }

    int32_t cmp_res = tRowKeyCompare(&pTargetCol->rowKey, &rowKey.key);
    if (!IS_LAST_KEY(((SLastKey *)TARRAY_DATA(keyArray))[jCol])) {
      if (cmp_res < 0 || (cmp_res == 0 && !COL_VAL_IS_NONE(pColVal))) {
        SLastCol lastCol = {.rowKey = rowKey.key, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(&lastCol, NULL));

        tsdbCacheFreeSLastColItem(pTargetCol);
        taosArraySet(pLastArray, jCol, &lastCol);
      }
    } else {
      if (COL_VAL_IS_VALUE(pColVal)) {
        if (cmp_res <= 0) {
          SLastCol lastCol = {
              .rowKey = rowKey.key, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
          TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(&lastCol, NULL));

          tsdbCacheFreeSLastColItem(pTargetCol);
          taosArraySet(pLastArray, jCol, &lastCol);
        }
      } else {
        // no value in this row: remember the column so following rows can supply one
        if (!iColHash) {
          iColHash = tSimpleHashInit(16, taosGetDefaultHashFunction(TSDB_DATA_TYPE_SMALLINT));
          if (iColHash == NULL) {
            TAOS_CHECK_EXIT(terrno);
          }
        }

        if (tSimpleHashPut(iColHash, &pColVal->cid, sizeof(pColVal->cid), &jCol, sizeof(jCol))) {
          TAOS_CHECK_EXIT(terrno);
        }
      }
    }

    ++jCol;

    // the same cid may occur in consecutive pLastArray entries; only advance the
    // row iterator once the next entry asks for a larger cid
    if (jCol < jnCol && ((SLastCol *)TARRAY_DATA(pLastArray))[jCol].colVal.cid > pColVal->cid) {
      pColVal = tsdbRowIterNext(&rowIter), ++iCol;
    }
  }
  tsdbRowClose(&rowIter);

  // 2, resolve the remembered columns from the following rows
  if (iColHash && tSimpleHashGetSize(iColHash) > 0) {
    pRow = memRowIterGet(&iter, false, NULL, 0);
    while (pRow) {
      if (tSimpleHashGetSize(iColHash) == 0) {
        break;
      }

      sversion = TSDBROW_SVERSION(pRow);
      if (sversion != -1) {
        TAOS_CHECK_EXIT(updateTSchema(sversion, pr, uid));

        pTSchema = pr->pCurrSchema;
      }
      nCol = pTSchema->numOfCols;

      STsdbRowKey tsdbRowKey = {0};
      tsdbRowGetKey(pRow, &tsdbRowKey);

      TAOS_CHECK_EXIT(tsdbRowIterOpen(&rowIter, pRow, pTSchema));

      iCol = 0;
      for (SColVal *pColVal = tsdbRowIterNext(&rowIter); pColVal && iCol < nCol;
           pColVal = tsdbRowIterNext(&rowIter), iCol++) {
        int32_t *pjCol = tSimpleHashGet(iColHash, &pColVal->cid, sizeof(pColVal->cid));
        if (pjCol && COL_VAL_IS_VALUE(pColVal)) {
          SLastCol *pTargetCol = &((SLastCol *)TARRAY_DATA(pLastArray))[*pjCol];

          int32_t cmp_res = tRowKeyCompare(&pTargetCol->rowKey, &tsdbRowKey.key);
          if (cmp_res <= 0) {
            SLastCol lastCol = {
                .rowKey = tsdbRowKey.key, .colVal = *pColVal, .dirty = 1, .cacheStatus = TSDB_LAST_CACHE_VALID};
            TAOS_CHECK_EXIT(tsdbCacheReallocSLastCol(&lastCol, NULL));

            tsdbCacheFreeSLastColItem(pTargetCol);
            taosArraySet(pLastArray, *pjCol, &lastCol);
          }

          // the column is settled as soon as a value was seen, replaced or not
          TAOS_CHECK_EXIT(tSimpleHashRemove(iColHash, &pColVal->cid, sizeof(pColVal->cid)));
        }
      }
      tsdbRowClose(&rowIter);

      pRow = memRowIterGet(&iter, false, NULL, 0);
    }
  }

_exit:
  if (code) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));

    tsdbRowClose(&rowIter);
  }

  tSimpleHashCleanup(iColHash);

  memRowIterClose(&iter);

  TAOS_RETURN(code);
}
2607

2608
/*
 * Fetch the last / last_row columns of table `uid` into pLastArray.
 *
 * The LRU-backed lookup always runs; when tsUpdateCacheBatch is set the result
 * is additionally overlaid with the in-memory rows. A scratch array of
 * SLastKey is shared between both steps and released before returning.
 *
 * Returns 0 on success or the failing step's error code (also logged).
 */
int32_t tsdbCacheGetBatch(STsdb *pTsdb, tb_uid_t uid, SArray *pLastArray, SCacheRowsReader *pr, int8_t ltype) {
  int32_t code = 0, lino = 0;
  SArray *keyArray = taosArrayInit(16, sizeof(SLastKey));

  if (keyArray == NULL) {
    TAOS_CHECK_EXIT(terrno);
  }

  // step 1: LRU cache
  TAOS_CHECK_EXIT(tsdbCacheGetBatchFromLru(pTsdb, uid, pLastArray, pr, ltype, keyArray));

  // step 2 (optional): in-memory rows
  if (tsUpdateCacheBatch) {
    TAOS_CHECK_EXIT(tsdbCacheGetBatchFromMem(pTsdb, uid, pLastArray, pr, keyArray));
  }

_exit:
  if (code != 0) {
    tsdbError("vgId:%d %s failed at %s:%d since %s", TD_VID(pTsdb->pVnode), __func__, __FILE__, lino, tstrerror(code));
  }

  if (keyArray != NULL) {
    taosArrayDestroy(keyArray);
  }

  TAOS_RETURN(code);
}
2634

2635
/*
 * Invalidate cached last / last_row entries of table `uid` whose timestamp
 * lies inside [sKey, eKey].
 *
 * For every column of the table's schema and for both flags
 * (LFLAG_LAST_ROW .. LFLAG_LAST):
 *  - if the entry is in the LRU cache and its timestamp is in range, it is
 *    overwritten with a dirty NONE placeholder (TSDB_LAST_CACHE_NO_CACHE);
 *  - if the entry is not in the LRU cache, its key is collected and looked up
 *    in rocksdb; a hit whose timestamp is in range is overwritten with a
 *    non-dirty NONE placeholder in both rocksdb and the LRU cache.
 *
 * pTsdb->lruMutex is held from the first LRU lookup until cleanup starts.
 *
 * Returns 0 on success or the first error code encountered.
 */
int32_t tsdbCacheDel(STsdb *pTsdb, tb_uid_t suid, tb_uid_t uid, TSKEY sKey, TSKEY eKey) {
  int32_t   code = 0, lino = 0;
  STSchema *pTSchema = NULL;
  int       sver = -1;
  int       numKeys = 0;
  SArray   *remainCols = NULL;
  // Declared and nulled up front: `goto _exit` may be taken from the first loop,
  // and the cleanup code below must never see indeterminate pointers.
  char  **keys_list = NULL;
  size_t *keys_list_sizes = NULL;
  char  **values_list = NULL;
  size_t *values_list_sizes = NULL;

  TAOS_CHECK_RETURN(metaGetTbTSchemaEx(pTsdb->pVnode->pMeta, suid, uid, sver, &pTSchema));

  int numCols = pTSchema->numOfCols;

  (void)taosThreadMutexLock(&pTsdb->lruMutex);

  // pass 1: entries present in the LRU cache; remember the keys that are not
  for (int i = 0; i < numCols; ++i) {
    int16_t cid = pTSchema->columns[i].colId;
    for (int8_t lflag = LFLAG_LAST_ROW; lflag <= LFLAG_LAST; ++lflag) {
      SLastKey   lastKey = {.lflag = lflag, .uid = uid, .cid = cid};
      LRUHandle *h = taosLRUCacheLookup(pTsdb->lruCache, &lastKey, ROCKS_KEY_LEN);
      if (h) {
        SLastCol *pLastCol = (SLastCol *)taosLRUCacheValue(pTsdb->lruCache, h);
        if (pLastCol->rowKey.ts <= eKey && pLastCol->rowKey.ts >= sKey) {
          SLastCol noneCol = {.rowKey.ts = TSKEY_MIN,
                              .colVal = COL_VAL_NONE(cid, pTSchema->columns[i].type),
                              .dirty = 1,
                              .cacheStatus = TSDB_LAST_CACHE_NO_CACHE};
          code = tsdbCachePutToLRU(pTsdb, &lastKey, &noneCol, 1);
        }
        // release the handle before acting on the put result
        tsdbLRUCacheRelease(pTsdb->lruCache, h, false);
        TAOS_CHECK_EXIT(code);
      } else {
        if (!remainCols) {
          remainCols = taosArrayInit(numCols * 2, sizeof(SIdxKey));
        }
        if (!taosArrayPush(remainCols, &(SIdxKey){i, lastKey})) {
          TAOS_CHECK_EXIT(terrno);
        }
      }
    }
  }

  if (remainCols) {
    numKeys = TARRAY_SIZE(remainCols);
  }

  keys_list = taosMemoryCalloc(numKeys, sizeof(char *));
  keys_list_sizes = taosMemoryCalloc(numKeys, sizeof(size_t));

  if (!keys_list || !keys_list_sizes) {
    code = terrno;
    goto _exit;
  }
  const size_t klen = ROCKS_KEY_LEN;

  for (int i = 0; i < numKeys; ++i) {
    char *key = taosMemoryCalloc(1, sizeof(SLastKey));
    if (!key) {
      code = terrno;
      goto _exit;
    }
    SIdxKey *idxKey = taosArrayGet(remainCols, i);

    ((SLastKey *)key)[0] = idxKey->key;

    keys_list[i] = key;
    keys_list_sizes[i] = klen;
  }

  rocksMayWrite(pTsdb, true);  // flush writebatch cache

  // pass 2: entries that only exist in rocksdb
  TAOS_CHECK_GOTO(tsdbCacheGetValuesFromRocks(pTsdb, numKeys, (const char *const *)keys_list, keys_list_sizes,
                                              &values_list, &values_list_sizes),
                  NULL, _exit);

  for (int i = 0; i < numKeys; ++i) {
    SLastCol *pLastCol = NULL;
    if (values_list[i] != NULL) {
      code = tsdbCacheDeserialize(values_list[i], values_list_sizes[i], &pLastCol);
      if (code != TSDB_CODE_SUCCESS) {
        tsdbError("vgId:%d, %s deserialize failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
                  tstrerror(code));
        goto _exit;
      }
    }
    SIdxKey  *idxKey = taosArrayGet(remainCols, i);
    SLastKey *pLastKey = &idxKey->key;
    if (NULL != pLastCol && (pLastCol->rowKey.ts <= eKey && pLastCol->rowKey.ts >= sKey)) {
      SLastCol noCacheCol = {.rowKey.ts = TSKEY_MIN,
                             .colVal = COL_VAL_NONE(pLastKey->cid, pTSchema->columns[idxKey->idx].type),
                             .dirty = 0,
                             .cacheStatus = TSDB_LAST_CACHE_NO_CACHE};

      if ((code = tsdbCachePutToRocksdb(pTsdb, pLastKey, &noCacheCol)) != TSDB_CODE_SUCCESS) {
        taosMemoryFreeClear(pLastCol);
        tsdbError("tsdb/cache/del: vgId:%d, put to rocks failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
        goto _exit;
      }
      if ((code = tsdbCachePutToLRU(pTsdb, pLastKey, &noCacheCol, 0)) != TSDB_CODE_SUCCESS) {
        taosMemoryFreeClear(pLastCol);
        tsdbError("tsdb/cache/del: vgId:%d, put to lru failed since %s.", TD_VID(pTsdb->pVnode), tstrerror(code));
        goto _exit;
      }
    }

    if (pLastCol == NULL) {
      tsdbDebug("tsdb/cache/del: vgId:%d, no cache found for uid:%" PRId64 ", cid:%d, lflag:%d.",
                TD_VID(pTsdb->pVnode), pLastKey->uid, pLastKey->cid, pLastKey->lflag);
    }

    taosMemoryFreeClear(pLastCol);
  }

  rocksMayWrite(pTsdb, false);

_exit:
  (void)taosThreadMutexUnlock(&pTsdb->lruMutex);

  // keys_list is NULL when its allocation failed or was never reached
  if (keys_list) {
    for (int i = 0; i < numKeys; ++i) {
      taosMemoryFree(keys_list[i]);
    }
  }
  taosMemoryFree(keys_list);
  taosMemoryFree(keys_list_sizes);
  if (values_list) {
    for (int i = 0; i < numKeys; ++i) {
      rocksdb_free(values_list[i]);
    }
    taosMemoryFree(values_list);
  }
  taosMemoryFree(values_list_sizes);
  taosArrayDestroy(remainCols);
  taosMemoryFree(pTSchema);

  TAOS_RETURN(code);
}
2771

2772
/*
 * Create the last/last_row LRU cache of a tsdb instance and open the block,
 * page and rocksdb caches.
 *
 * The LRU capacity is config.cacheLastSize interpreted in MiB. On success the
 * cache is stored in pTsdb->lruCache and pTsdb->lruMutex is initialised.
 * On failure the LRU cache created here is released again and
 * pTsdb->lruCache is left NULL, so that no cache is ever published without
 * its mutex having been initialised.
 *
 * Returns 0 on success or the error code of the failing step (also logged).
 */
int32_t tsdbOpenCache(STsdb *pTsdb) {
  int32_t code = 0, lino = 0;
  size_t  cfgCapacity = (size_t)pTsdb->pVnode->config.cacheLastSize * 1024 * 1024;

  SLRUCache *pCache = taosLRUCacheInit(cfgCapacity, 0, .5);
  if (pCache == NULL) {
    TAOS_CHECK_GOTO(TSDB_CODE_OUT_OF_MEMORY, &lino, _err);
  }

  TAOS_CHECK_GOTO(tsdbOpenBCache(pTsdb), &lino, _err);

  TAOS_CHECK_GOTO(tsdbOpenPgCache(pTsdb), &lino, _err);

  TAOS_CHECK_GOTO(tsdbOpenRocksCache(pTsdb), &lino, _err);

  taosLRUCacheSetStrictCapacity(pCache, false);

  (void)taosThreadMutexInit(&pTsdb->lruMutex, NULL);

_err:
  if (code) {
    tsdbError("tsdb/cache: vgId:%d, open failed at line %d since %s.", TD_VID(pTsdb->pVnode), lino, tstrerror(code));

    // lruMutex was not initialised on this path; do not hand out the cache
    if (pCache != NULL) {
      taosLRUCacheCleanup(pCache);
      pCache = NULL;
    }
  }

  pTsdb->lruCache = pCache;

  TAOS_RETURN(code);
}
2800

2801
/*
 * Tear down the caches of a tsdb instance.
 *
 * When an LRU cache is present its unreferenced entries are erased, the cache
 * is cleaned up and lruMutex is destroyed. The block, page and rocksdb caches
 * are closed unconditionally afterwards.
 */
void tsdbCloseCache(STsdb *pTsdb) {
  if (pTsdb->lruCache != NULL) {
    SLRUCache *pLru = pTsdb->lruCache;

    taosLRUCacheEraseUnrefEntries(pLru);
    taosLRUCacheCleanup(pLru);

    (void)taosThreadMutexDestroy(&pTsdb->lruMutex);
  }

  tsdbCloseBCache(pTsdb);
  tsdbClosePgCache(pTsdb);
  tsdbCloseRocksCache(pTsdb);
}
×
2815

2816
/*
 * Build the 8-byte cache key of a table.
 *
 * key receives the uid as a native-endian uint64_t; for any cacheType other
 * than 0 (last_row) the most significant bit is set to mark a "last" key.
 * *len is set to the key size, sizeof(uint64_t).
 *
 * The value is stored with memcpy so that `key` may be any char buffer of at
 * least 8 bytes, regardless of its alignment.
 */
static void getTableCacheKey(tb_uid_t uid, int cacheType, char *key, int *len) {
  uint64_t rawKey = (uint64_t)uid;

  if (cacheType != 0) {  // last
    rawKey |= 0x8000000000000000ULL;
  }

  memcpy(key, &rawKey, sizeof(rawKey));

  *len = sizeof(uint64_t);
}
×
2825

2826
/*
 * Look up the super-table uid of table `uid`.
 *
 * Returns the suid stored in the table entry when the table is a child table.
 * Returns 0 when the entry cannot be read (table does not exist) or when the
 * table is of any other type.
 */
static tb_uid_t getTableSuidByUid(tb_uid_t uid, STsdb *pTsdb) {
  tb_uid_t    result = 0;
  SMetaReader reader = {0};

  metaReaderDoInit(&reader, pTsdb->pVnode->pMeta, META_READER_LOCK);

  // only a successfully read child-table entry carries a non-zero suid
  if (metaReaderGetTableEntryByUidCache(&reader, uid) >= 0 && reader.me.type == TSDB_CHILD_TABLE) {
    result = reader.me.ctbEntry.suid;
  }

  metaReaderClear(&reader);

  return result;
}
2848

2849
/*
 * Read the delete records referenced by pDelIdx into aDelData.
 *
 * A NULL pDelIdx is a no-op. Returns 0 in that case, otherwise the result of
 * tsdbReadDelDatav1 (called with INT64_MAX as its last argument).
 */
static int32_t getTableDelDataFromDelIdx(SDelFReader *pDelReader, SDelIdx *pDelIdx, SArray *aDelData) {
  int32_t rc = pDelIdx ? tsdbReadDelDatav1(pDelReader, pDelIdx, aDelData, INT64_MAX) : 0;

  TAOS_RETURN(rc);
}
2858

2859
/*
 * Append every delete record of pTbData (linked list starting at pHead) to
 * aDelData.
 *
 * A NULL pTbData yields no records. Returns 0 on success, or terrno as soon
 * as an append fails.
 */
static int32_t getTableDelDataFromTbData(STbData *pTbData, SArray *aDelData) {
  int32_t   rc = 0;
  SDelData *pCur = NULL;

  if (pTbData) {
    pCur = pTbData->pHead;
  }

  while (pCur != NULL) {
    if (taosArrayPush(aDelData, pCur) == NULL) {
      TAOS_RETURN(terrno);
    }
    pCur = pCur->pNext;
  }

  TAOS_RETURN(rc);
}
2871

2872
/*
 * Return the reader's sorted uid list, building it on first use.
 *
 * The list holds the uid of each of the reader's numOfTables tables, ordered
 * with uidComparFunc, and is kept in pReader->uidList for later calls.
 * Returns NULL when the allocation fails.
 */
static uint64_t *getUidList(SCacheRowsReader *pReader) {
  if (pReader->uidList != NULL) {
    return pReader->uidList;
  }

  int32_t   nTables = pReader->numOfTables;
  uint64_t *pList = taosMemoryMalloc(nTables * sizeof(uint64_t));

  pReader->uidList = pList;
  if (pList == NULL) {
    return NULL;
  }

  for (int32_t idx = 0; idx < nTables; ++idx) {
    pList[idx] = pReader->pTableList[idx].uid;
  }

  taosSort(pList, nTables, sizeof(uint64_t), uidComparFunc);

  return pReader->uidList;
}
2891

2892
/*
 * Load the tomb (delete) records of the reader's tables from the tomb blocks
 * listed in pTombBlkArray and append them to each table's pTombData.
 *
 * pFileReader is a data-file reader when isFile is true and an stt-file
 * reader otherwise. Tomb blocks whose [minTbid, maxTbid] range cannot contain
 * any uid of the reader's sorted uid list are skipped; inside a block, records
 * are matched against the uid list with a forward-only cursor `j`. Only
 * records with version <= pReader->info.verRange.maxVer are kept.
 *
 * The tomb block read for each iteration is destroyed on every exit path.
 *
 * Returns TSDB_CODE_SUCCESS, or the first error code encountered.
 */
static int32_t loadTombFromBlk(const TTombBlkArray *pTombBlkArray, SCacheRowsReader *pReader, void *pFileReader,
                               bool isFile) {
  int32_t   code = 0;
  int32_t   numOfTables = pReader->numOfTables;
  int64_t   suid = pReader->info.suid;
  uint64_t *uidList = getUidList(pReader);

  if (!uidList) {
    TAOS_RETURN(terrno);
  }

  for (int i = 0, j = 0; i < pTombBlkArray->size && j < numOfTables; ++i) {
    STombBlk *pTombBlk = &pTombBlkArray->data[i];
    // block ends before the smallest wanted uid
    if (pTombBlk->maxTbid.suid < suid || (pTombBlk->maxTbid.suid == suid && pTombBlk->maxTbid.uid < uidList[0])) {
      continue;
    }

    // block starts after the largest wanted uid
    if (pTombBlk->minTbid.suid > suid ||
        (pTombBlk->minTbid.suid == suid && pTombBlk->minTbid.uid > uidList[numOfTables - 1])) {
      break;
    }

    STombBlock block = {0};
    code = isFile ? tsdbDataFileReadTombBlock(pFileReader, &pTombBlkArray->data[i], &block)
                  : tsdbSttFileReadTombBlock(pFileReader, &pTombBlkArray->data[i], &block);
    if (code != TSDB_CODE_SUCCESS) {
      TAOS_RETURN(code);
    }

    uint64_t        uid = uidList[j];
    STableLoadInfo *pInfo = getTableLoadInfo(pReader, uid);
    if (!pInfo) {
      tTombBlockDestroy(&block);
      TAOS_RETURN(TSDB_CODE_OUT_OF_MEMORY);
    }

    if (pInfo->pTombData == NULL) {
      pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
      if (!pInfo->pTombData) {
        code = terrno;  // capture before cleanup can touch terrno
        tTombBlockDestroy(&block);
        TAOS_RETURN(code);
      }
    }

    STombRecord record = {0};
    bool        finished = false;
    for (int32_t k = 0; k < TOMB_BLOCK_SIZE(&block); ++k) {
      code = tTombBlockGet(&block, k, &record);
      if (code != TSDB_CODE_SUCCESS) {
        finished = true;
        break;
      }

      if (record.suid < suid) {
        continue;
      }
      if (record.suid > suid) {
        finished = true;
        break;
      }

      // advance the uid cursor until it reaches or passes the record's uid
      bool newTable = false;
      if (uid < record.uid) {
        while (j < numOfTables && uidList[j] < record.uid) {
          ++j;
          newTable = true;
        }

        if (j >= numOfTables) {
          finished = true;
          break;
        }

        uid = uidList[j];
      }

      if (record.uid < uid) {
        continue;
      }

      if (newTable) {
        pInfo = getTableLoadInfo(pReader, uid);
        if (!pInfo) {
          code = TSDB_CODE_OUT_OF_MEMORY;
          finished = true;
          break;
        }
        if (pInfo->pTombData == NULL) {
          pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
          if (!pInfo->pTombData) {
            code = terrno;
            finished = true;
            break;
          }
        }
      }

      if (record.version <= pReader->info.verRange.maxVer) {
        /*tsdbError("tomb xx load/cache: vgId:%d fid:%d record %" PRId64 "~%" PRId64 "~%" PRId64 " tomb records",
          TD_VID(pReader->pTsdb->pVnode), pReader->pCurFileSet->fid, record.skey, record.ekey, uid);*/

        SDelData delData = {.version = record.version, .sKey = record.skey, .eKey = record.ekey};
        if (!taosArrayPush(pInfo->pTombData, &delData)) {
          // leave through the common path so the tomb block is destroyed
          code = terrno;
          finished = true;
          break;
        }
      }
    }

    tTombBlockDestroy(&block);

    if (finished) {
      TAOS_RETURN(code);
    }
  }

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
3005

3006
/*
 * Load tomb records for the reader's tables from a data file: fetch the
 * file's tomb block index, then hand it to loadTombFromBlk in data-file mode.
 */
static int32_t loadDataTomb(SCacheRowsReader *pReader, SDataFileReader *pFileReader) {
  const TTombBlkArray *pTombBlks = NULL;

  TAOS_CHECK_RETURN(tsdbDataFileReadTombBlk(pFileReader, &pTombBlks));

  TAOS_RETURN(loadTombFromBlk(pTombBlks, pReader, pFileReader, true /* isFile */));
}
3013

3014
/*
 * Load tomb records for the reader's tables from an stt file.
 *
 * pTsdbReader is reinterpreted as the SCacheRowsReader it is used as here;
 * pLoadInfo is not used. Fetches the stt file's tomb block index and hands it
 * to loadTombFromBlk in stt-file mode.
 */
static int32_t loadSttTomb(STsdbReader *pTsdbReader, SSttFileReader *pSttFileReader, SSttBlockLoadInfo *pLoadInfo) {
  const TTombBlkArray *pTombBlks = NULL;
  SCacheRowsReader    *pCacheReader = (SCacheRowsReader *)pTsdbReader;

  TAOS_CHECK_RETURN(tsdbSttFileReadTombBlk(pSttFileReader, &pTombBlks));

  TAOS_RETURN(loadTombFromBlk(pTombBlks, pCacheReader, pSttFileReader, false /* isFile */));
}
3022

3023
typedef struct {
3024
  SMergeTree  mergeTree;
3025
  SMergeTree *pMergeTree;
3026
} SFSLastIter;
3027

3028
/*
 * Open a backward merge-tree iterator over the stt files of pFileSet for
 * table (suid, uid).
 *
 * The reader's stt block iterator array is destroyed and re-created first.
 * The merge tree covers the time window [lastTs, TSKEY_MAX] and versions
 * [0, INT64_MAX], loads the columns aCols[0..nCols) and uses loadSttTomb to
 * load tomb data.
 *
 * Returns 0 on success, terrno when the iterator array cannot be allocated,
 * or the error reported while opening the merge tree.
 */
static int32_t lastIterOpen(SFSLastIter *iter, STFileSet *pFileSet, STsdb *pTsdb, STSchema *pTSchema, tb_uid_t suid,
                            tb_uid_t uid, SCacheRowsReader *pr, int64_t lastTs, int16_t *aCols, int nCols) {
  int32_t code = 0;

  // start from a fresh stt block iterator array
  destroySttBlockReader(pr->pLDataIterArray, NULL);
  pr->pLDataIterArray = taosArrayInit(4, POINTER_BYTES);
  if (pr->pLDataIterArray == NULL) return terrno;

  SMergeTreeConf conf = {0};

  conf.uid = uid;
  conf.suid = suid;
  conf.pTsdb = pTsdb;
  conf.timewindow = (STimeWindow){.skey = lastTs, .ekey = TSKEY_MAX};
  conf.verRange = (SVersionRange){.minVer = 0, .maxVer = INT64_MAX};
  conf.strictTimeRange = false;
  conf.pSchema = pTSchema;
  conf.pCurrentFileset = pFileSet;
  conf.backward = 1;
  conf.pSttFileBlockIterArray = pr->pLDataIterArray;
  conf.pCols = aCols;
  conf.numOfCols = nCols;
  conf.loadTombFn = loadSttTomb;
  conf.pReader = pr;
  conf.idstr = pr->idstr;
  conf.pCurRowKey = &pr->rowKey;

  TAOS_CHECK_RETURN(tMergeTreeOpen2(&iter->mergeTree, &conf, NULL));

  // mark the iterator as open
  iter->pMergeTree = &iter->mergeTree;

  TAOS_RETURN(code);
}
3060

3061
/*
 * Close the merge tree of *iter (if it is open) and reset the caller's
 * iterator pointer to NULL. Always returns 0.
 */
static int32_t lastIterClose(SFSLastIter **iter) {
  int32_t      code = 0;
  SFSLastIter *pIter = *iter;

  if (pIter->pMergeTree != NULL) {
    tMergeTreeClose(pIter->pMergeTree);
    pIter->pMergeTree = NULL;
  }

  *iter = NULL;

  TAOS_RETURN(code);
}
3073

3074
/*
 * Advance the stt iterator by one row.
 *
 * *ppRow is set to the merge tree's current row, or to NULL when the merge
 * tree reports no further value or an error. Returns the merge tree's error
 * code, 0 otherwise.
 */
static int32_t lastIterNext(SFSLastIter *iter, TSDBROW **ppRow) {
  bool gotRow = false;

  *ppRow = NULL;

  int32_t code = tMergeTreeNext(iter->pMergeTree, &gotRow);
  if (code != 0) {
    return code;
  }

  if (gotRow) {
    *ppRow = tMergeTreeGetRow(iter->pMergeTree);
  }

  TAOS_RETURN(code);
}
3091

3092
/* States of the file-set row iterator state machine driven by getNextRowFromFS. */
typedef enum SFSNEXTROWSTATES {
  SFSNEXTROW_FS = 0,      // initial state: position after the last file set
  SFSNEXTROW_FILESET,     // step to the previous file set and open its readers
  SFSNEXTROW_INDEXLIST,   // step to the previous brin block of the index list
  SFSNEXTROW_BRINBLOCK,   // step to the previous brin record of the brin block
  SFSNEXTROW_BRINRECORD,  // load the block data referenced by the brin record
  SFSNEXTROW_BLOCKDATA,   // NOTE(review): no transition to this state is visible here
  SFSNEXTROW_BLOCKROW,    // hand out rows of the loaded block data, last row first
  SFSNEXTROW_NEXTSTTROW   // hand out rows from the stt iterator only
} SFSNEXTROWSTATES;
3102

3103
struct CacheNextRowIter;
3104

3105
typedef struct SFSNextRowIter {
3106
  SFSNEXTROWSTATES         state;         // [input]
3107
  SBlockIdx               *pBlockIdxExp;  // [input]
3108
  STSchema                *pTSchema;      // [input]
3109
  tb_uid_t                 suid;
3110
  tb_uid_t                 uid;
3111
  int32_t                  iFileSet;
3112
  STFileSet               *pFileSet;
3113
  TFileSetArray           *aDFileSet;
3114
  SArray                  *pIndexList;
3115
  int32_t                  iBrinIndex;
3116
  SBrinBlock               brinBlock;
3117
  SBrinBlock              *pBrinBlock;
3118
  int32_t                  iBrinRecord;
3119
  SBrinRecord              brinRecord;
3120
  SBlockData               blockData;
3121
  SBlockData              *pBlockData;
3122
  int32_t                  nRow;
3123
  int32_t                  iRow;
3124
  TSDBROW                  row;
3125
  int64_t                  lastTs;
3126
  SFSLastIter              lastIter;
3127
  SFSLastIter             *pLastIter;
3128
  int8_t                   lastEmpty;
3129
  TSDBROW                 *pLastRow;
3130
  SRow                    *pTSRow;
3131
  SRowMerger               rowMerger;
3132
  SCacheRowsReader        *pr;
3133
  struct CacheNextRowIter *pRowIter;
3134
} SFSNextRowIter;
3135

3136
static void clearLastFileSet(SFSNextRowIter *state);
3137

3138
static int32_t getNextRowFromFS(void *iter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast, int16_t *aCols,
×
3139
                                int nCols) {
3140
  int32_t         code = 0, lino = 0;
×
3141
  SFSNextRowIter *state = (SFSNextRowIter *)iter;
×
3142
  STsdb          *pTsdb = state->pr->pTsdb;
×
3143

3144
  if (SFSNEXTROW_FS == state->state) {
×
3145
    state->iFileSet = TARRAY2_SIZE(state->aDFileSet);
×
3146

3147
    state->state = SFSNEXTROW_FILESET;
×
3148
  }
3149

3150
  if (SFSNEXTROW_FILESET == state->state) {
×
3151
  _next_fileset:
×
3152
    clearLastFileSet(state);
×
3153

3154
    if (--state->iFileSet < 0) {
×
3155
      *ppRow = NULL;
×
3156

3157
      TAOS_RETURN(code);
×
3158
    } else {
3159
      state->pFileSet = TARRAY2_GET(state->aDFileSet, state->iFileSet);
×
3160
    }
3161

3162
    STFileObj **pFileObj = state->pFileSet->farr;
×
3163
    if (pFileObj[0] != NULL || pFileObj[3] != NULL) {
×
3164
      if (state->pFileSet != state->pr->pCurFileSet) {
×
3165
        SDataFileReaderConfig conf = {.tsdb = pTsdb, .szPage = pTsdb->pVnode->config.tsdbPageSize};
×
3166
        const char           *filesName[4] = {0};
×
3167
        if (pFileObj[0] != NULL) {
×
3168
          conf.files[0].file = *pFileObj[0]->f;
×
3169
          conf.files[0].exist = true;
×
3170
          filesName[0] = pFileObj[0]->fname;
×
3171

3172
          conf.files[1].file = *pFileObj[1]->f;
×
3173
          conf.files[1].exist = true;
×
3174
          filesName[1] = pFileObj[1]->fname;
×
3175

3176
          conf.files[2].file = *pFileObj[2]->f;
×
3177
          conf.files[2].exist = true;
×
3178
          filesName[2] = pFileObj[2]->fname;
×
3179
        }
3180

3181
        if (pFileObj[3] != NULL) {
×
3182
          conf.files[3].exist = true;
×
3183
          conf.files[3].file = *pFileObj[3]->f;
×
3184
          filesName[3] = pFileObj[3]->fname;
×
3185
        }
3186

3187
        TAOS_CHECK_GOTO(tsdbDataFileReaderOpen(filesName, &conf, &state->pr->pFileReader), &lino, _err);
×
3188

3189
        state->pr->pCurFileSet = state->pFileSet;
×
3190

3191
        code = loadDataTomb(state->pr, state->pr->pFileReader);
×
3192
        if (code != TSDB_CODE_SUCCESS) {
×
3193
          tsdbError("vgId:%d, %s load tomb failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
×
3194
                    tstrerror(code));
3195
          TAOS_CHECK_GOTO(code, &lino, _err);
×
3196
        }
3197

3198
        TAOS_CHECK_GOTO(tsdbDataFileReadBrinBlk(state->pr->pFileReader, &state->pr->pBlkArray), &lino, _err);
×
3199
      }
3200

3201
      if (!state->pIndexList) {
×
3202
        state->pIndexList = taosArrayInit(1, sizeof(SBrinBlk));
×
3203
        if (!state->pIndexList) {
×
3204
          TAOS_CHECK_GOTO(terrno, &lino, _err);
×
3205
        }
3206
      } else {
3207
        taosArrayClear(state->pIndexList);
×
3208
      }
3209

3210
      const TBrinBlkArray *pBlkArray = state->pr->pBlkArray;
×
3211

3212
      for (int i = TARRAY2_SIZE(pBlkArray) - 1; i >= 0; --i) {
×
3213
        SBrinBlk *pBrinBlk = &pBlkArray->data[i];
×
3214
        if (state->suid >= pBrinBlk->minTbid.suid && state->suid <= pBrinBlk->maxTbid.suid) {
×
3215
          if (state->uid >= pBrinBlk->minTbid.uid && state->uid <= pBrinBlk->maxTbid.uid) {
×
3216
            if (!taosArrayPush(state->pIndexList, pBrinBlk)) {
×
3217
              TAOS_CHECK_GOTO(terrno, &lino, _err);
×
3218
            }
3219
          }
3220
        } else if (state->suid > pBrinBlk->maxTbid.suid ||
×
3221
                   (state->suid == pBrinBlk->maxTbid.suid && state->uid > pBrinBlk->maxTbid.uid)) {
×
3222
          break;
3223
        }
3224
      }
3225

3226
      int indexSize = TARRAY_SIZE(state->pIndexList);
×
3227
      if (indexSize <= 0) {
×
3228
        goto _check_stt_data;
×
3229
      }
3230

3231
      state->state = SFSNEXTROW_INDEXLIST;
×
3232
      state->iBrinIndex = 1;
×
3233
    }
3234

3235
  _check_stt_data:
×
3236
    if (state->pFileSet != state->pr->pCurFileSet) {
×
3237
      state->pr->pCurFileSet = state->pFileSet;
×
3238
    }
3239

3240
    TAOS_CHECK_GOTO(lastIterOpen(&state->lastIter, state->pFileSet, pTsdb, state->pTSchema, state->suid, state->uid,
×
3241
                                 state->pr, state->lastTs, aCols, nCols),
3242
                    &lino, _err);
3243

3244
    TAOS_CHECK_GOTO(lastIterNext(&state->lastIter, &state->pLastRow), &lino, _err);
×
3245

3246
    if (!state->pLastRow) {
×
3247
      state->lastEmpty = 1;
×
3248

3249
      if (SFSNEXTROW_INDEXLIST != state->state) {
×
3250
        clearLastFileSet(state);
×
3251
        goto _next_fileset;
×
3252
      }
3253
    } else {
3254
      state->lastEmpty = 0;
×
3255

3256
      if (SFSNEXTROW_INDEXLIST != state->state) {
×
3257
        state->state = SFSNEXTROW_NEXTSTTROW;
×
3258

3259
        *ppRow = state->pLastRow;
×
3260
        state->pLastRow = NULL;
×
3261

3262
        TAOS_RETURN(code);
×
3263
      }
3264
    }
3265

3266
    state->pLastIter = &state->lastIter;
×
3267
  }
3268

3269
  if (SFSNEXTROW_NEXTSTTROW == state->state) {
×
3270
    TAOS_CHECK_GOTO(lastIterNext(&state->lastIter, &state->pLastRow), &lino, _err);
×
3271

3272
    if (!state->pLastRow) {
×
3273
      if (state->pLastIter) {
×
3274
        code = lastIterClose(&state->pLastIter);
×
3275
        if (code != TSDB_CODE_SUCCESS) {
×
3276
          tsdbError("vgId:%d, %s close last iter failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
×
3277
                    tstrerror(code));
3278
          TAOS_RETURN(code);
×
3279
        }
3280
      }
3281

3282
      clearLastFileSet(state);
×
3283
      state->state = SFSNEXTROW_FILESET;
×
3284
      goto _next_fileset;
×
3285
    } else {
3286
      *ppRow = state->pLastRow;
×
3287
      state->pLastRow = NULL;
×
3288

3289
      TAOS_RETURN(code);
×
3290
    }
3291
  }
3292

3293
  if (SFSNEXTROW_INDEXLIST == state->state) {
×
3294
    SBrinBlk *pBrinBlk = NULL;
×
3295
  _next_brinindex:
×
3296
    if (--state->iBrinIndex < 0) {
×
3297
      if (state->pLastRow) {
×
3298
        state->state = SFSNEXTROW_NEXTSTTROW;
×
3299
        *ppRow = state->pLastRow;
×
3300
        state->pLastRow = NULL;
×
3301
        return code;
×
3302
      }
3303

3304
      clearLastFileSet(state);
×
3305
      goto _next_fileset;
×
3306
    } else {
3307
      pBrinBlk = taosArrayGet(state->pIndexList, state->iBrinIndex);
×
3308
    }
3309

3310
    if (!state->pBrinBlock) {
×
3311
      state->pBrinBlock = &state->brinBlock;
×
3312
    } else {
3313
      tBrinBlockClear(&state->brinBlock);
×
3314
    }
3315

3316
    TAOS_CHECK_GOTO(tsdbDataFileReadBrinBlock(state->pr->pFileReader, pBrinBlk, &state->brinBlock), &lino, _err);
×
3317

3318
    state->iBrinRecord = state->brinBlock.numOfRecords - 1;
×
3319
    state->state = SFSNEXTROW_BRINBLOCK;
×
3320
  }
3321

3322
  if (SFSNEXTROW_BRINBLOCK == state->state) {
×
3323
  _next_brinrecord:
×
3324
    if (state->iBrinRecord < 0) {  // empty brin block, goto _next_brinindex
×
3325
      tBrinBlockClear(&state->brinBlock);
×
3326
      goto _next_brinindex;
×
3327
    }
3328

3329
    TAOS_CHECK_GOTO(tBrinBlockGet(&state->brinBlock, state->iBrinRecord, &state->brinRecord), &lino, _err);
×
3330

3331
    SBrinRecord *pRecord = &state->brinRecord;
×
3332
    if (pRecord->uid != state->uid) {
×
3333
      // TODO: goto next brin block early
3334
      --state->iBrinRecord;
×
3335
      goto _next_brinrecord;
×
3336
    }
3337

3338
    state->state = SFSNEXTROW_BRINRECORD;
×
3339
  }
3340

3341
  if (SFSNEXTROW_BRINRECORD == state->state) {
×
3342
    SBrinRecord *pRecord = &state->brinRecord;
×
3343

3344
    if (!state->pBlockData) {
×
3345
      state->pBlockData = &state->blockData;
×
3346

3347
      TAOS_CHECK_GOTO(tBlockDataCreate(&state->blockData), &lino, _err);
×
3348
    } else {
3349
      tBlockDataReset(state->pBlockData);
×
3350
    }
3351

3352
    if (aCols[0] == PRIMARYKEY_TIMESTAMP_COL_ID) {
×
3353
      --nCols;
×
3354
      ++aCols;
×
3355
    }
3356

3357
    TAOS_CHECK_GOTO(tsdbDataFileReadBlockDataByColumn(state->pr->pFileReader, pRecord, state->pBlockData,
×
3358
                                                      state->pTSchema, aCols, nCols),
3359
                    &lino, _err);
3360

3361
    state->nRow = state->blockData.nRow;
×
3362
    state->iRow = state->nRow - 1;
×
3363

3364
    state->state = SFSNEXTROW_BLOCKROW;
×
3365
  }
3366

3367
  if (SFSNEXTROW_BLOCKROW == state->state) {
×
3368
    if (state->iRow < 0) {
×
3369
      --state->iBrinRecord;
×
3370
      goto _next_brinrecord;
×
3371
    }
3372

3373
    state->row = tsdbRowFromBlockData(state->pBlockData, state->iRow);
×
3374
    if (!state->pLastIter) {
×
3375
      *ppRow = &state->row;
×
3376
      --state->iRow;
×
3377
      return code;
×
3378
    }
3379

3380
    if (!state->pLastRow) {
×
3381
      // get next row from fslast and process with fs row, --state->Row if select fs row
3382
      TAOS_CHECK_GOTO(lastIterNext(&state->lastIter, &state->pLastRow), &lino, _err);
×
3383
    }
3384

3385
    if (!state->pLastRow) {
×
3386
      if (state->pLastIter) {
×
3387
        code = lastIterClose(&state->pLastIter);
×
3388
        if (code != TSDB_CODE_SUCCESS) {
×
3389
          tsdbError("vgId:%d, %s close last iter failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
×
3390
                    tstrerror(code));
3391
          TAOS_RETURN(code);
×
3392
        }
3393
      }
3394

3395
      *ppRow = &state->row;
×
3396
      --state->iRow;
×
3397
      return code;
×
3398
    }
3399

3400
    // process state->pLastRow & state->row
3401
    TSKEY rowTs = TSDBROW_TS(&state->row);
×
3402
    TSKEY lastRowTs = TSDBROW_TS(state->pLastRow);
×
3403
    if (lastRowTs > rowTs) {
×
3404
      *ppRow = state->pLastRow;
×
3405
      state->pLastRow = NULL;
×
3406

3407
      TAOS_RETURN(code);
×
3408
    } else if (lastRowTs < rowTs) {
×
3409
      *ppRow = &state->row;
×
3410
      --state->iRow;
×
3411

3412
      TAOS_RETURN(code);
×
3413
    } else {
3414
      // TODO: merge rows and *ppRow = mergedRow
3415
      SRowMerger *pMerger = &state->rowMerger;
×
3416
      code = tsdbRowMergerInit(pMerger, state->pTSchema);
×
3417
      if (code != TSDB_CODE_SUCCESS) {
×
3418
        tsdbError("vgId:%d, %s init row merger failed at line %d since %s", TD_VID(pTsdb->pVnode), __func__, __LINE__,
×
3419
                  tstrerror(code));
3420
        TAOS_RETURN(code);
×
3421
      }
3422

3423
      TAOS_CHECK_GOTO(tsdbRowMergerAdd(pMerger, &state->row, state->pTSchema), &lino, _err);
×
3424
      TAOS_CHECK_GOTO(tsdbRowMergerAdd(pMerger, state->pLastRow, state->pTSchema), &lino, _err);
×
3425

3426
      if (state->pTSRow) {
×
3427
        taosMemoryFree(state->pTSRow);
×
3428
        state->pTSRow = NULL;
×
3429
      }
3430

3431
      TAOS_CHECK_GOTO(tsdbRowMergerGetRow(pMerger, &state->pTSRow), &lino, _err);
×
3432

3433
      state->row = tsdbRowFromTSRow(TSDBROW_VERSION(&state->row), state->pTSRow);
×
3434
      *ppRow = &state->row;
×
3435
      --state->iRow;
×
3436

3437
      tsdbRowMergerClear(pMerger);
×
3438

3439
      TAOS_RETURN(code);
×
3440
    }
3441
  }
3442

3443
_err:
×
3444
  clearLastFileSet(state);
×
3445

3446
  *ppRow = NULL;
×
3447

3448
  if (code) {
×
3449
    tsdbError("tsdb/cache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
×
3450
              tstrerror(code));
3451
  }
3452

3453
  TAOS_RETURN(code);
×
3454
}
3455

3456
typedef struct CacheNextRowIter {
3457
  SArray           *pMemDelData;
3458
  SArray           *pSkyline;
3459
  int64_t           iSkyline;
3460
  SBlockIdx         idx;
3461
  SMemNextRowIter   memState;
3462
  SMemNextRowIter   imemState;
3463
  SFSNextRowIter    fsState;
3464
  TSDBROW           memRow, imemRow, fsLastRow, fsRow;
3465
  TsdbNextRowState  input[3];
3466
  SCacheRowsReader *pr;
3467
  STsdb            *pTsdb;
3468
} CacheNextRowIter;
3469

3470
int32_t clearNextRowFromFS(void *iter) {
×
3471
  int32_t code = 0;
×
3472

3473
  SFSNextRowIter *state = (SFSNextRowIter *)iter;
×
3474
  if (!state) {
×
3475
    TAOS_RETURN(code);
×
3476
  }
3477

3478
  if (state->pLastIter) {
×
3479
    code = lastIterClose(&state->pLastIter);
×
3480
    if (code != TSDB_CODE_SUCCESS) {
×
3481
      tsdbError("%s close last iter failed at line %d since %s", __func__, __LINE__, tstrerror(code));
×
3482
      TAOS_RETURN(code);
×
3483
    }
3484
  }
3485

3486
  if (state->pBlockData) {
×
3487
    tBlockDataDestroy(state->pBlockData);
×
3488
    state->pBlockData = NULL;
×
3489
  }
3490

3491
  if (state->pBrinBlock) {
×
3492
    tBrinBlockDestroy(state->pBrinBlock);
×
3493
    state->pBrinBlock = NULL;
×
3494
  }
3495

3496
  if (state->pIndexList) {
×
3497
    taosArrayDestroy(state->pIndexList);
×
3498
    state->pIndexList = NULL;
×
3499
  }
3500

3501
  if (state->pTSRow) {
×
3502
    taosMemoryFree(state->pTSRow);
×
3503
    state->pTSRow = NULL;
×
3504
  }
3505

3506
  if (state->pRowIter->pSkyline) {
×
3507
    taosArrayDestroy(state->pRowIter->pSkyline);
×
3508
    state->pRowIter->pSkyline = NULL;
×
3509
  }
3510

3511
  TAOS_RETURN(code);
×
3512
}
3513

3514
/**
 * Drop all per-file-set state of a file-system row iterator so that the next
 * file set can be opened: last-file iterator, block data, data file reader,
 * merged row buffer, delete skyline and the tomb data cached per table.
 *
 * A failure while closing the last-file iterator is logged but no longer
 * stops the cleanup, otherwise the file reader and buffers would be leaked.
 */
static void clearLastFileSet(SFSNextRowIter *state) {
  if (state->pLastIter) {
    int code = lastIterClose(&state->pLastIter);
    if (code != TSDB_CODE_SUCCESS) {
      // best effort: report the problem and continue releasing everything else
      tsdbError("%s close last iter failed at line %d since %s", __func__, __LINE__, tstrerror(code));
    }
  }

  if (state->pBlockData) {
    tBlockDataDestroy(state->pBlockData);
    state->pBlockData = NULL;
  }

  if (state->pr->pFileReader) {
    tsdbDataFileReaderClose(&state->pr->pFileReader);
    state->pr->pFileReader = NULL;

    state->pr->pCurFileSet = NULL;
  }

  if (state->pTSRow) {
    taosMemoryFree(state->pTSRow);
    state->pTSRow = NULL;
  }

  if (state->pRowIter->pSkyline) {
    taosArrayDestroy(state->pRowIter->pSkyline);
    state->pRowIter->pSkyline = NULL;

    // the skyline was built from the per-table tomb data, so drop that as well
    void   *pe = NULL;
    int32_t iter = 0;
    while ((pe = tSimpleHashIterate(state->pr->pTableMap, pe, &iter)) != NULL) {
      STableLoadInfo *pInfo = *(STableLoadInfo **)pe;
      taosArrayDestroy(pInfo->pTombData);
      pInfo->pTombData = NULL;
    }
  }
}
3553

3554
static int32_t nextRowIterOpen(CacheNextRowIter *pIter, tb_uid_t uid, STsdb *pTsdb, STSchema *pTSchema, tb_uid_t suid,
×
3555
                               SArray *pLDataIterArray, STsdbReadSnap *pReadSnap, int64_t lastTs,
3556
                               SCacheRowsReader *pr) {
3557
  int32_t code = 0, lino = 0;
×
3558

3559
  STbData *pMem = NULL;
×
3560
  if (pReadSnap->pMem) {
×
3561
    pMem = tsdbGetTbDataFromMemTable(pReadSnap->pMem, suid, uid);
×
3562
  }
3563

3564
  STbData *pIMem = NULL;
×
3565
  if (pReadSnap->pIMem) {
×
3566
    pIMem = tsdbGetTbDataFromMemTable(pReadSnap->pIMem, suid, uid);
×
3567
  }
3568

3569
  pIter->pTsdb = pTsdb;
×
3570

3571
  pIter->pMemDelData = NULL;
×
3572

3573
  TAOS_CHECK_GOTO(loadMemTombData(&pIter->pMemDelData, pMem, pIMem, pr->info.verRange.maxVer), &lino, _err);
×
3574

3575
  pIter->idx = (SBlockIdx){.suid = suid, .uid = uid};
×
3576

3577
  pIter->fsState.pRowIter = pIter;
×
3578
  pIter->fsState.state = SFSNEXTROW_FS;
×
3579
  pIter->fsState.aDFileSet = pReadSnap->pfSetArray;
×
3580
  pIter->fsState.pBlockIdxExp = &pIter->idx;
×
3581
  pIter->fsState.pTSchema = pTSchema;
×
3582
  pIter->fsState.suid = suid;
×
3583
  pIter->fsState.uid = uid;
×
3584
  pIter->fsState.lastTs = lastTs;
×
3585
  pIter->fsState.pr = pr;
×
3586

3587
  pIter->input[0] = (TsdbNextRowState){&pIter->memRow, true, false, false, &pIter->memState, getNextRowFromMem, NULL};
×
3588
  pIter->input[1] = (TsdbNextRowState){&pIter->imemRow, true, false, false, &pIter->imemState, getNextRowFromMem, NULL};
×
3589
  pIter->input[2] =
×
3590
      (TsdbNextRowState){&pIter->fsRow, false, true, false, &pIter->fsState, getNextRowFromFS, clearNextRowFromFS};
×
3591

3592
  if (pMem) {
×
3593
    pIter->memState.pMem = pMem;
×
3594
    pIter->memState.state = SMEMNEXTROW_ENTER;
×
3595
    pIter->memState.lastTs = lastTs;
×
3596
    pIter->input[0].stop = false;
×
3597
    pIter->input[0].next = true;
×
3598
  }
3599

3600
  if (pIMem) {
×
3601
    pIter->imemState.pMem = pIMem;
×
3602
    pIter->imemState.state = SMEMNEXTROW_ENTER;
×
3603
    pIter->imemState.lastTs = lastTs;
×
3604
    pIter->input[1].stop = false;
×
3605
    pIter->input[1].next = true;
×
3606
  }
3607

3608
  pIter->pr = pr;
×
3609

3610
_err:
×
3611
  TAOS_RETURN(code);
×
3612
}
3613

3614
/*
 * Tear down a CacheNextRowIter: run the clear callback of every input that
 * has one (its result is ignored), then free the skyline and the mem delete
 * data arrays if they exist.
 */
static void nextRowIterClose(CacheNextRowIter *pIter) {
  for (int i = 0; i < 3; ++i) {
    TsdbNextRowState *pInput = &pIter->input[i];
    if (!pInput->nextRowClearFn) {
      continue;
    }

    (void)pInput->nextRowClearFn(pInput->iter);
  }

  if (pIter->pSkyline) {
    taosArrayDestroy(pIter->pSkyline);
  }

  if (pIter->pMemDelData) {
    taosArrayDestroy(pIter->pMemDelData);
  }
}
×
3629

3630
// iterate next row non deleted backward ts, version (from high to low)
3631
static int32_t nextRowIterGet(CacheNextRowIter *pIter, TSDBROW **ppRow, bool *pIgnoreEarlierTs, bool isLast,
×
3632
                              int16_t *aCols, int nCols) {
3633
  int32_t code = 0, lino = 0;
×
3634

3635
  for (;;) {
×
3636
    for (int i = 0; i < 3; ++i) {
×
3637
      if (pIter->input[i].next && !pIter->input[i].stop) {
×
3638
        TAOS_CHECK_GOTO(pIter->input[i].nextRowFn(pIter->input[i].iter, &pIter->input[i].pRow,
×
3639
                                                  &pIter->input[i].ignoreEarlierTs, isLast, aCols, nCols),
3640
                        &lino, _err);
3641

3642
        if (pIter->input[i].pRow == NULL) {
×
3643
          pIter->input[i].stop = true;
×
3644
          pIter->input[i].next = false;
×
3645
        }
3646
      }
3647
    }
3648

3649
    if (pIter->input[0].stop && pIter->input[1].stop && pIter->input[2].stop) {
×
3650
      *ppRow = NULL;
×
3651
      *pIgnoreEarlierTs =
×
3652
          (pIter->input[0].ignoreEarlierTs || pIter->input[1].ignoreEarlierTs || pIter->input[2].ignoreEarlierTs);
×
3653

3654
      TAOS_RETURN(code);
×
3655
    }
3656

3657
    // select maxpoint(s) from mem, imem, fs and last
3658
    TSDBROW *max[4] = {0};
×
3659
    int      iMax[4] = {-1, -1, -1, -1};
×
3660
    int      nMax = 0;
×
3661
    SRowKey  maxKey = {.ts = TSKEY_MIN};
×
3662

3663
    for (int i = 0; i < 3; ++i) {
×
3664
      if (!pIter->input[i].stop && pIter->input[i].pRow != NULL) {
×
3665
        STsdbRowKey tsdbRowKey = {0};
×
3666
        tsdbRowGetKey(pIter->input[i].pRow, &tsdbRowKey);
×
3667

3668
        // merging & deduplicating on client side
3669
        int c = tRowKeyCompare(&maxKey, &tsdbRowKey.key);
×
3670
        if (c <= 0) {
×
3671
          if (c < 0) {
×
3672
            nMax = 0;
×
3673
            maxKey = tsdbRowKey.key;
×
3674
          }
3675

3676
          iMax[nMax] = i;
×
3677
          max[nMax++] = pIter->input[i].pRow;
×
3678
        }
3679
        pIter->input[i].next = false;
×
3680
      }
3681
    }
3682

3683
    // delete detection
3684
    TSDBROW *merge[4] = {0};
×
3685
    int      iMerge[4] = {-1, -1, -1, -1};
×
3686
    int      nMerge = 0;
×
3687
    for (int i = 0; i < nMax; ++i) {
×
3688
      TSDBKEY maxKey1 = TSDBROW_KEY(max[i]);
×
3689

3690
      if (!pIter->pSkyline) {
×
3691
        pIter->pSkyline = taosArrayInit(32, sizeof(TSDBKEY));
×
3692
        TSDB_CHECK_NULL(pIter->pSkyline, code, lino, _err, terrno);
×
3693

3694
        uint64_t        uid = pIter->idx.uid;
×
3695
        STableLoadInfo *pInfo = getTableLoadInfo(pIter->pr, uid);
×
3696
        TSDB_CHECK_NULL(pInfo, code, lino, _err, TSDB_CODE_OUT_OF_MEMORY);
×
3697

3698
        if (pInfo->pTombData == NULL) {
×
3699
          pInfo->pTombData = taosArrayInit(4, sizeof(SDelData));
×
3700
          TSDB_CHECK_NULL(pInfo->pTombData, code, lino, _err, terrno);
×
3701
        }
3702

3703
        if (!taosArrayAddAll(pInfo->pTombData, pIter->pMemDelData)) {
×
3704
          TAOS_CHECK_GOTO(terrno, &lino, _err);
×
3705
        }
3706

3707
        size_t delSize = TARRAY_SIZE(pInfo->pTombData);
×
3708
        if (delSize > 0) {
×
3709
          code = tsdbBuildDeleteSkyline(pInfo->pTombData, 0, (int32_t)(delSize - 1), pIter->pSkyline);
×
3710
          TAOS_CHECK_GOTO(code, &lino, _err);
×
3711
        }
3712
        pIter->iSkyline = taosArrayGetSize(pIter->pSkyline) - 1;
×
3713
      }
3714

3715
      bool deleted = tsdbKeyDeleted(&maxKey1, pIter->pSkyline, &pIter->iSkyline);
×
3716
      if (!deleted) {
×
3717
        iMerge[nMerge] = iMax[i];
×
3718
        merge[nMerge++] = max[i];
×
3719
      }
3720

3721
      pIter->input[iMax[i]].next = deleted;
×
3722
    }
3723

3724
    if (nMerge > 0) {
×
3725
      pIter->input[iMerge[0]].next = true;
×
3726

3727
      *ppRow = merge[0];
×
3728

3729
      TAOS_RETURN(code);
×
3730
    }
3731
  }
3732

3733
_err:
×
3734
  if (code) {
×
3735
    tsdbError("tsdb/cache: %s failed at line %d since %s.", __func__, lino, tstrerror(code));
×
3736
  }
3737

3738
  TAOS_RETURN(code);
×
3739
}
3740

3741
/**
 * Build an array of nCols SLastCol entries, one per requested slot, each
 * initialised with rowKey.ts = 0 and a NULL column value carrying the column
 * id and type found at pTSchema->columns[slotIds[i]].
 *
 * @param pTSchema    schema used to resolve column id/type of each slot
 * @param ppColArray  receives the new array on success; left untouched on failure
 * @param slotIds     schema slot index of every requested column
 * @param nCols       number of entries in slotIds
 * @return TSDB_CODE_SUCCESS, or terrno when allocation/push fails. On failure
 *         the partially filled array is released instead of being leaked.
 */
static int32_t initLastColArrayPartial(STSchema *pTSchema, SArray **ppColArray, int16_t *slotIds, int nCols) {
  SArray *pColArray = taosArrayInit(nCols, sizeof(SLastCol));
  if (NULL == pColArray) {
    TAOS_RETURN(terrno);
  }

  for (int32_t i = 0; i < nCols; ++i) {
    int16_t  slotId = slotIds[i];
    SLastCol col = {.rowKey.ts = 0,
                    .colVal = COL_VAL_NULL(pTSchema->columns[slotId].colId, pTSchema->columns[slotId].type)};
    if (!taosArrayPush(pColArray, &col)) {
      // capture the error first, the cleanup below must not be able to overwrite it
      int32_t code = terrno;
      taosArrayDestroy(pColArray);

      TAOS_RETURN(code);
    }
  }
  *ppColArray = pColArray;

  TAOS_RETURN(TSDB_CODE_SUCCESS);
}
3759

3760
/**
 * Compute the "last" (most recent non-NULL) value of the requested columns of
 * one table by walking its rows from the newest key downwards.
 *
 * @param uid          table uid
 * @param pTsdb        tsdb instance (used for iteration and logging)
 * @param ppLastArray  receives an SArray of SLastCol, one entry per requested
 *                     column. It is NULL on error, and also when no row was
 *                     found while the iterator reported ignoreEarlierTs; it is
 *                     an empty array when no row was found otherwise.
 * @param pr           cache rows reader providing schema, snapshot and lastTs
 * @param aCols        column ids of the requested columns
 * @param nCols        number of requested columns
 * @param slotIds      schema slot index of every requested column
 * @return 0 on success, error code otherwise.
 *
 * Fixes over the previous version: the column-id work array is released when
 * filling it fails, and an error returned by nextRowIterGet() now takes the
 * common cleanup path instead of handing a half-built array back together
 * with an error code.
 */
static int32_t mergeLastCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr, int16_t *aCols,
                            int nCols, int16_t *slotIds) {
  int32_t   code = 0, lino = 0;
  STSchema *pTSchema = pr->pSchema;  // metaGetTbTSchema(pTsdb->pVnode->pMeta, uid, -1, 1);
  int16_t   nLastCol = nCols;
  int16_t   noneCol = 0;  // first column index that still has no value
  bool      setNoneCol = false;
  bool      hasRow = false;
  bool      ignoreEarlierTs = false;
  SArray   *pColArray = NULL;
  SColVal  *pColVal = &(SColVal){0};

  TAOS_CHECK_RETURN(initLastColArrayPartial(pTSchema, &pColArray, slotIds, nCols));

  // column ids still to be resolved; passed to the iterator and shrunk as values are found
  SArray *aColArray = taosArrayInit(nCols, sizeof(int16_t));
  if (NULL == aColArray) {
    code = terrno;
    taosArrayDestroy(pColArray);

    TAOS_RETURN(code);
  }

  for (int i = 0; i < nCols; ++i) {
    if (!taosArrayPush(aColArray, &aCols[i])) {
      code = terrno;
      taosArrayDestroy(pColArray);
      taosArrayDestroy(aColArray);

      TAOS_RETURN(code);
    }
  }

  STsdbRowKey lastRowKey = {.key.ts = TSKEY_MAX};

  // inverse iterator
  CacheNextRowIter iter = {0};
  code =
      nextRowIterOpen(&iter, uid, pTsdb, pTSchema, pr->info.suid, pr->pLDataIterArray, pr->pReadSnap, pr->lastTs, pr);
  TAOS_CHECK_GOTO(code, &lino, _err);

  do {
    TSDBROW *pRow = NULL;
    code = nextRowIterGet(&iter, &pRow, &ignoreEarlierTs, true, TARRAY_DATA(aColArray), TARRAY_SIZE(aColArray));
    TAOS_CHECK_GOTO(code, &lino, _err);

    if (!pRow) {
      break;
    }

    hasRow = true;

    int32_t sversion = TSDBROW_SVERSION(pRow);
    if (sversion != -1) {
      TAOS_CHECK_GOTO(updateTSchema(sversion, pr, uid), &lino, _err);

      pTSchema = pr->pCurrSchema;
    }

    STsdbRowKey rowKey = {0};
    tsdbRowGetKey(pRow, &rowKey);

    if (lastRowKey.key.ts == TSKEY_MAX) {  // first time
      lastRowKey = rowKey;

      for (int16_t iCol = noneCol; iCol < nCols; ++iCol) {
        if (iCol >= nLastCol) {
          break;
        }
        SLastCol *pCol = taosArrayGet(pColArray, iCol);
        if (slotIds[iCol] > pTSchema->numOfCols - 1) {
          // slot does not exist in this row's schema version; keep looking in older rows
          if (!setNoneCol) {
            noneCol = iCol;
            setNoneCol = true;
          }
          continue;
        }
        if (pCol->colVal.cid != pTSchema->columns[slotIds[iCol]].colId) {
          continue;
        }
        if (slotIds[iCol] == 0) {
          // slot 0 is filled from the row key timestamp
          STColumn *pTColumn = &pTSchema->columns[0];
          *pColVal = COL_VAL_VALUE(pTColumn->colId, ((SValue){.type = pTColumn->type, .val = rowKey.key.ts}));

          SLastCol colTmp = {.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
          TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(&colTmp, NULL), &lino, _err);

          // NOTE(review): writes array index 0 rather than iCol; presumably slot 0 is always
          // requested first -- confirm against callers
          taosArraySet(pColArray, 0, &colTmp);
          continue;
        }
        tsdbRowGetColVal(pRow, pTSchema, slotIds[iCol], pColVal);

        *pCol = (SLastCol){.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(pCol, NULL), &lino, _err);

        if (!COL_VAL_IS_VALUE(pColVal)) {
          if (!setNoneCol) {
            noneCol = iCol;
            setNoneCol = true;
          }
        } else {
          // value found: this column no longer needs to be read from older rows
          int32_t aColIndex = taosArraySearchIdx(aColArray, &pColVal->cid, compareInt16Val, TD_EQ);
          if (aColIndex >= 0) {
            taosArrayRemove(aColArray, aColIndex);
          }
        }
      }
      if (!setNoneCol) {
        // done, goto return pColArray
        break;
      } else {
        continue;
      }
    }

    // merge into pColArray
    setNoneCol = false;
    for (int16_t iCol = noneCol; iCol < nCols; ++iCol) {
      if (iCol >= nLastCol) {
        break;
      }
      // high version's column value
      if (slotIds[iCol] > pTSchema->numOfCols - 1) {
        continue;
      }

      SLastCol *lastColVal = (SLastCol *)taosArrayGet(pColArray, iCol);
      if (lastColVal->colVal.cid != pTSchema->columns[slotIds[iCol]].colId) {
        continue;
      }
      SColVal *tColVal = &lastColVal->colVal;
      if (COL_VAL_IS_VALUE(tColVal)) continue;

      tsdbRowGetColVal(pRow, pTSchema, slotIds[iCol], pColVal);
      if (COL_VAL_IS_VALUE(pColVal)) {
        SLastCol lastCol = {.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(&lastCol, NULL), &lino, _err);

        tsdbCacheFreeSLastColItem(lastColVal);
        taosArraySet(pColArray, iCol, &lastCol);
        int32_t aColIndex = taosArraySearchIdx(aColArray, &lastCol.colVal.cid, compareInt16Val, TD_EQ);
        if (aColIndex >= 0) {
          taosArrayRemove(aColArray, aColIndex);
        }
      } else if (!COL_VAL_IS_VALUE(pColVal) && !setNoneCol) {
        noneCol = iCol;
        setNoneCol = true;
      }
    }
  } while (setNoneCol);

  if (!hasRow) {
    if (ignoreEarlierTs) {
      taosArrayDestroy(pColArray);
      pColArray = NULL;
    } else {
      taosArrayClear(pColArray);
    }
  }
  *ppLastArray = pColArray;

  nextRowIterClose(&iter);
  taosArrayDestroy(aColArray);

  TAOS_RETURN(code);

_err:
  nextRowIterClose(&iter);
  // taosMemoryFreeClear(pTSchema);
  *ppLastArray = NULL;
  taosArrayDestroyEx(pColArray, tsdbCacheFreeSLastColItem);
  taosArrayDestroy(aColArray);

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
3936

3937
/**
 * Compute the "last row" values of the requested columns of one table: only
 * the newest non-deleted row is consulted and its values are taken as they
 * are (NULL values included).
 *
 * @param uid          table uid
 * @param pTsdb        tsdb instance (used for iteration and logging)
 * @param ppLastArray  receives an SArray of SLastCol, one entry per requested
 *                     column. It is NULL on error, and also when no row was
 *                     found while the iterator reported ignoreEarlierTs; it is
 *                     an empty array when no row was found otherwise.
 * @param pr           cache rows reader providing schema, snapshot and lastTs
 * @param aCols        column ids of the requested columns
 * @param nCols        number of requested columns
 * @param slotIds      schema slot index of every requested column
 * @return 0 on success, error code otherwise.
 *
 * Fixes over the previous version: the column-id work array is released when
 * filling it fails, and an error returned by nextRowIterGet() now takes the
 * common cleanup path instead of handing a half-built array back together
 * with an error code.
 */
static int32_t mergeLastRowCid(tb_uid_t uid, STsdb *pTsdb, SArray **ppLastArray, SCacheRowsReader *pr, int16_t *aCols,
                               int nCols, int16_t *slotIds) {
  int32_t   code = 0, lino = 0;
  STSchema *pTSchema = pr->pSchema;  // metaGetTbTSchema(pTsdb->pVnode->pMeta, uid, -1, 1);
  int16_t   nLastCol = nCols;
  int16_t   noneCol = 0;
  bool      hasRow = false;
  bool      ignoreEarlierTs = false;
  SArray   *pColArray = NULL;
  SColVal  *pColVal = &(SColVal){0};

  TAOS_CHECK_RETURN(initLastColArrayPartial(pTSchema, &pColArray, slotIds, nCols));

  // column ids handed to the iterator
  SArray *aColArray = taosArrayInit(nCols, sizeof(int16_t));
  if (NULL == aColArray) {
    code = terrno;
    taosArrayDestroy(pColArray);

    TAOS_RETURN(code);
  }

  for (int i = 0; i < nCols; ++i) {
    if (!taosArrayPush(aColArray, &aCols[i])) {
      code = terrno;
      taosArrayDestroy(pColArray);
      taosArrayDestroy(aColArray);

      TAOS_RETURN(code);
    }
  }

  // inverse iterator
  CacheNextRowIter iter = {0};
  code =
      nextRowIterOpen(&iter, uid, pTsdb, pTSchema, pr->info.suid, pr->pLDataIterArray, pr->pReadSnap, pr->lastTs, pr);
  TAOS_CHECK_GOTO(code, &lino, _err);

  // only the newest row matters for last_row
  TSDBROW *pRow = NULL;
  code = nextRowIterGet(&iter, &pRow, &ignoreEarlierTs, false, TARRAY_DATA(aColArray), TARRAY_SIZE(aColArray));
  TAOS_CHECK_GOTO(code, &lino, _err);

  if (pRow) {
    hasRow = true;

    int32_t sversion = TSDBROW_SVERSION(pRow);
    if (sversion != -1) {
      TAOS_CHECK_GOTO(updateTSchema(sversion, pr, uid), &lino, _err);

      pTSchema = pr->pCurrSchema;
    }

    STsdbRowKey rowKey = {0};
    tsdbRowGetKey(pRow, &rowKey);

    for (int16_t iCol = noneCol; iCol < nCols; ++iCol) {
      if (iCol >= nLastCol) {
        break;
      }
      SLastCol *pCol = taosArrayGet(pColArray, iCol);
      if (slotIds[iCol] > pTSchema->numOfCols - 1) {
        // slot does not exist in this row's schema version
        continue;
      }
      if (pCol->colVal.cid != pTSchema->columns[slotIds[iCol]].colId) {
        continue;
      }
      if (slotIds[iCol] == 0) {
        // slot 0 is filled from the row key timestamp
        STColumn *pTColumn = &pTSchema->columns[0];
        *pColVal = COL_VAL_VALUE(pTColumn->colId, ((SValue){.type = pTColumn->type, .val = rowKey.key.ts}));

        SLastCol colTmp = {.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
        TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(&colTmp, NULL), &lino, _err);

        // NOTE(review): writes array index 0 rather than iCol; presumably slot 0 is always
        // requested first -- confirm against callers
        taosArraySet(pColArray, 0, &colTmp);
        continue;
      }
      tsdbRowGetColVal(pRow, pTSchema, slotIds[iCol], pColVal);

      *pCol = (SLastCol){.rowKey = rowKey.key, .colVal = *pColVal, .cacheStatus = TSDB_LAST_CACHE_VALID};
      TAOS_CHECK_GOTO(tsdbCacheReallocSLastCol(pCol, NULL), &lino, _err);

      int32_t aColIndex = taosArraySearchIdx(aColArray, &pColVal->cid, compareInt16Val, TD_EQ);
      if (aColIndex >= 0) {
        taosArrayRemove(aColArray, aColIndex);
      }
    }
  }

  if (!hasRow) {
    if (ignoreEarlierTs) {
      taosArrayDestroy(pColArray);
      pColArray = NULL;
    } else {
      taosArrayClear(pColArray);
    }
  }
  *ppLastArray = pColArray;

  nextRowIterClose(&iter);
  taosArrayDestroy(aColArray);

  TAOS_RETURN(code);

_err:
  nextRowIterClose(&iter);

  *ppLastArray = NULL;
  taosArrayDestroyEx(pColArray, tsdbCacheFreeSLastColItem);
  taosArrayDestroy(aColArray);

  if (code) {
    tsdbError("tsdb/cache: vgId:%d, %s failed at line %d since %s.", TD_VID(pTsdb->pVnode), __func__, lino,
              tstrerror(code));
  }

  TAOS_RETURN(code);
}
4057

4058
// Release a handle obtained from pCache without requesting erase-on-last-reference.
void tsdbCacheRelease(SLRUCache *pCache, LRUHandle *h) {
  const bool eraseIfLastRef = false;

  tsdbLRUCacheRelease(pCache, h, eraseIfLastRef);
}
×
4059

4060
// Set the capacity of the vnode's tsdb LRU cache.
void tsdbCacheSetCapacity(SVnode *pVnode, size_t capacity) {
  SLRUCache *pLru = pVnode->pTsdb->lruCache;

  taosLRUCacheSetCapacity(pLru, capacity);
}
×
4063

4064
#ifdef BUILD_NO_CALL
// Report the capacity of the vnode's tsdb LRU cache (only built with BUILD_NO_CALL).
size_t tsdbCacheGetCapacity(SVnode *pVnode) {
  SLRUCache *pLru = pVnode->pTsdb->lruCache;

  return taosLRUCacheGetCapacity(pLru);
}
#endif
4067

4068
// Current usage of the vnode's tsdb LRU cache; 0 when the vnode has no tsdb.
size_t tsdbCacheGetUsage(SVnode *pVnode) {
  if (pVnode->pTsdb == NULL) {
    return 0;
  }

  return taosLRUCacheGetUsage(pVnode->pTsdb->lruCache);
}
4076

4077
// Number of elements in the vnode's tsdb LRU cache; 0 when the vnode has no tsdb.
int32_t tsdbCacheGetElems(SVnode *pVnode) {
  if (pVnode->pTsdb == NULL) {
    return 0;
  }

  return taosLRUCacheGetElems(pVnode->pTsdb->lruCache);
}
4085

4086
// block cache
4087
/**
 * Serialise (fid, commitID, blkno) into a binary cache key.
 *
 * @param fid       file id
 * @param commitID  commit id of the file
 * @param blkno     block (or page) number inside the file
 * @param key       output buffer; must hold at least sizeof(the key struct) bytes
 * @param len       receives the number of bytes written to key
 *
 * The key is the raw image of a struct that contains alignment padding after
 * fid. The whole struct is cleared with memset() before the members are
 * stored so that the padding bytes copied into the key are deterministic;
 * an "= {0}" initialiser only guarantees the members, not the padding.
 */
static void getBCacheKey(int32_t fid, int64_t commitID, int64_t blkno, char *key, int *len) {
  struct {
    int32_t fid;
    int64_t commitID;
    int64_t blkno;
  } bKey;

  memset(&bKey, 0, sizeof(bKey));

  bKey.fid = fid;
  bKey.commitID = commitID;
  bKey.blkno = blkno;

  *len = (int)sizeof(bKey);
  memcpy(key, &bKey, sizeof(bKey));
}
×
4101

4102
/*
 * Fetch the block numbered pFD->blkno (1-based) of the object pFD->objName
 * through tcsGetObjectBlock(). One block covers tsS3BlockSize pages of
 * pFD->szPage bytes. On success *ppBlock holds the buffer produced by
 * tcsGetObjectBlock(); any error from that call is returned as is.
 */
static int32_t tsdbCacheLoadBlockS3(STsdbFD *pFD, uint8_t **ppBlock) {
  int32_t code = 0;

  // byte offset of the requested block inside the object
  int64_t offset = (pFD->blkno - 1) * tsS3BlockSize * pFD->szPage;

  TAOS_CHECK_RETURN(tcsGetObjectBlock(pFD->objName, offset, tsS3BlockSize * pFD->szPage, 0, ppBlock));

  tsdbTrace("block:%p load from s3", *ppBlock);

  return code;
}
4114

4115
// LRU deleter for block/page cache entries: frees the cached buffer; key, keyLen and ud are unused.
static void deleteBCache(const void *key, size_t keyLen, void *value, void *ud) {
  (void)ud;

  taosMemoryFree((uint8_t *)value);
}
×
4121

4122
/*
 * Look up the block (pFD->fid, pFD->cid, pFD->blkno) in pCache, loading it
 * with tsdbCacheLoadBlockS3() and inserting it when it is missing.
 *
 * The cache is probed once without the lock and, on a miss, again while
 * holding pTsdb->bMutex before the block is loaded.
 *
 * *handle receives the cache handle, or NULL when loading failed. Returns 0
 * on success, the load error on failure, or TSDB_CODE_OUT_OF_MEMORY when the
 * load reported success but produced no block. The insert status is ignored.
 */
int32_t tsdbCacheGetBlockS3(SLRUCache *pCache, STsdbFD *pFD, LRUHandle **handle) {
  int32_t code = 0;
  char    key[128] = {0};
  int     keyLen = 0;

  getBCacheKey(pFD->fid, pFD->cid, pFD->blkno, key, &keyLen);

  LRUHandle *h = taosLRUCacheLookup(pCache, key, keyLen);
  if (h) {
    // fast path: hit without taking the lock
    *handle = h;

    TAOS_RETURN(code);
  }

  STsdb *pTsdb = pFD->pTsdb;
  (void)taosThreadMutexLock(&pTsdb->bMutex);

  // probe again under the lock before loading
  h = taosLRUCacheLookup(pCache, key, keyLen);
  if (!h) {
    uint8_t *pBlock = NULL;
    code = tsdbCacheLoadBlockS3(pFD, &pBlock);

    if (code != TSDB_CODE_SUCCESS || pBlock == NULL) {
      (void)taosThreadMutexUnlock(&pTsdb->bMutex);

      *handle = NULL;
      if (code == TSDB_CODE_SUCCESS) {
        // the load reported success but returned no buffer
        code = TSDB_CODE_OUT_OF_MEMORY;
      }

      TAOS_RETURN(code);
    }

    size_t              charge = tsS3BlockSize * pFD->szPage;
    _taos_lru_deleter_t deleter = deleteBCache;
    LRUStatus           status =
        taosLRUCacheInsert(pCache, key, keyLen, pBlock, charge, deleter, NULL, &h, TAOS_LRU_PRIORITY_LOW, NULL);
    if (status != TAOS_LRU_STATUS_OK) {
      // insert failures are deliberately not turned into an error code
    }
  }

  (void)taosThreadMutexUnlock(&pTsdb->bMutex);

  *handle = h;

  TAOS_RETURN(code);
}
4165

4166
/*
 * Look up page pgno of file (pFD->fid, pFD->cid) in pCache. *handle receives
 * the lookup result (NULL on a miss). Always returns 0.
 */
int32_t tsdbCacheGetPageS3(SLRUCache *pCache, STsdbFD *pFD, int64_t pgno, LRUHandle **handle) {
  char pageKey[128] = {0};
  int  pageKeyLen = 0;

  getBCacheKey(pFD->fid, pFD->cid, pgno, pageKey, &pageKeyLen);
  *handle = taosLRUCacheLookup(pCache, pageKey, pageKeyLen);

  return 0;
}
4176

4177
/**
 * Store a copy of one page in the page cache unless it is already cached.
 *
 * @param pCache  cache the copied page is inserted into
 * @param pFD     file descriptor; supplies fid/cid for the key, the page size
 *                and the tsdb whose pgMutex guards the operation
 * @param pgno    page number
 * @param pPage   source page, pFD->szPage bytes are copied
 *
 * Errors are intentionally swallowed: caching is best effort. The mutex is
 * now released on the allocation-failure path as well; previously that early
 * return left pgMutex locked.
 *
 * NOTE(review): the lookup and the final release use pFD->pTsdb->pgCache while
 * the insert uses pCache; presumably callers always pass the same cache --
 * confirm.
 */
void tsdbCacheSetPageS3(SLRUCache *pCache, STsdbFD *pFD, int64_t pgno, uint8_t *pPage) {
  char       key[128] = {0};
  int        keyLen = 0;
  LRUHandle *handle = NULL;

  getBCacheKey(pFD->fid, pFD->cid, pgno, key, &keyLen);
  (void)taosThreadMutexLock(&pFD->pTsdb->pgMutex);
  handle = taosLRUCacheLookup(pFD->pTsdb->pgCache, key, keyLen);
  if (!handle) {
    size_t              charge = pFD->szPage;
    _taos_lru_deleter_t deleter = deleteBCache;
    uint8_t            *pPg = taosMemoryMalloc(charge);
    if (!pPg) {
      // ignore error with s3 cache and leave error untouched, but never leave the lock held
      (void)taosThreadMutexUnlock(&pFD->pTsdb->pgMutex);
      return;
    }
    memcpy(pPg, pPage, charge);

    LRUStatus status =
        taosLRUCacheInsert(pCache, key, keyLen, pPg, charge, deleter, NULL, &handle, TAOS_LRU_PRIORITY_LOW, NULL);
    if (status != TAOS_LRU_STATUS_OK) {
      // ignore cache updating if not ok
      // code = TSDB_CODE_OUT_OF_MEMORY;
    }
  }
  (void)taosThreadMutexUnlock(&pFD->pTsdb->pgMutex);

  // drop the reference taken by the lookup/insert above
  tsdbCacheRelease(pFD->pTsdb->pgCache, handle);
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc