• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #4997

20 Mar 2026 06:10AM UTC coverage: 71.739% (-0.3%) from 72.069%
#4997

push

travis-ci

web-flow
feat: add query phase tracking for SHOW QUERIES (#34706)

148 of 183 new or added lines in 10 files covered. (80.87%)

9273 existing lines in 172 files now uncovered.

244572 of 340921 relevant lines covered (71.74%)

133392941.95 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

71.99
/source/libs/executor/src/groupcacheoperator.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#include "executorInt.h"
17
#include "filter.h"
18
#include "function.h"
19
#include "operator.h"
20
#include "os.h"
21
#include "querynodes.h"
22
#include "querytask.h"
23
#include "tcompare.h"
24
#include "tdatablock.h"
25
#include "thash.h"
26
#include "tmsg.h"
27
#include "ttypes.h"
28
#include "groupcache.h"
29

30

31
static void removeGroupCacheFile(SGroupCacheFileInfo* pFileInfo) {
142,603✔
32
  if (pFileInfo->fd.fd) {
142,603✔
33
    if (taosCloseFile(&pFileInfo->fd.fd) < 0) {
142,603✔
34
      qError("close group cache file failed, fd:%p, error:%s", pFileInfo->fd.fd, tstrerror(terrno));
×
35
    }
36
    pFileInfo->fd.fd = NULL;
142,603✔
37
    (void)taosThreadMutexDestroy(&pFileInfo->fd.mutex);
142,603✔
38
  }
39
  pFileInfo->deleted = true;
142,603✔
40
}
142,603✔
41

42

43
static int32_t initGroupColsInfo(SGroupColsInfo* pCols, bool grpColsMayBeNull, SNodeList* pList) {
×
44
  pCols->colNum = LIST_LENGTH(pList);
×
45
  pCols->withNull = grpColsMayBeNull;  
×
46
  pCols->pColsInfo = taosMemoryMalloc(pCols->colNum * sizeof(SGroupColInfo));
×
47
  if (NULL == pCols->pColsInfo) {
×
48
    return terrno;
×
49
  }
50

51
  int32_t i = 0;
×
52
  SNode* pNode = NULL;
×
53
  FOREACH(pNode, pList) {
×
54
    SColumnNode* pColNode = (SColumnNode*)pNode;
×
55
    pCols->pColsInfo[i].slot = pColNode->slotId;
×
56
    pCols->pColsInfo[i].vardata = IS_VAR_DATA_TYPE(pColNode->node.resType.type);
×
57
    pCols->pColsInfo[i].bytes = pColNode->node.resType.bytes;
×
58
    pCols->bufSize += pColNode->node.resType.bytes;
×
59
    ++i;
×
60
  }  
61

62
  if (pCols->withNull) {
×
63
    pCols->bitMapSize = pCols->colNum / sizeof(int8_t) + ((pCols->colNum % sizeof(int8_t)) ? 1 : 0);
×
64
    pCols->bufSize += pCols->bitMapSize;
×
65
  }
66

67
  if (pCols->colNum > 1) {
×
68
    pCols->pBuf = taosMemoryMalloc(pCols->bufSize);
×
69
    if (NULL == pCols->pBuf) {
×
70
      return terrno;
×
71
    }
72
  }
73

74
  return TSDB_CODE_SUCCESS;
×
75
}
76

77
static void logGroupCacheExecInfo(SGroupCacheOperatorInfo* pGrpCacheOperator) {
1,195,276✔
78
  if (pGrpCacheOperator->downstreamNum <= 0 || NULL == pGrpCacheOperator->execInfo.pDownstreamBlkNum) {
1,195,276✔
79
    return;
×
80
  }
81

82
  int32_t bufSize = pGrpCacheOperator->downstreamNum * 32 + 100;
1,195,276✔
83
  char* buf = taosMemoryMalloc(bufSize);
1,195,276✔
84
  if (NULL == buf) {
1,195,276✔
85
    return;
×
86
  }
87
  int32_t offset = snprintf(buf, bufSize, "groupCache exec info, downstreamBlkNum:");
1,195,276✔
88
  for (int32_t i = 0; i < pGrpCacheOperator->downstreamNum; ++i) {
3,585,828✔
89
    offset += snprintf(buf + offset, bufSize - offset, " %" PRId64, pGrpCacheOperator->execInfo.pDownstreamBlkNum[i]);
2,390,552✔
90
  }
91
  qDebug("%s", buf);
1,195,276✔
92
  taosMemoryFree(buf);
1,195,276✔
93
}
94

95
static void freeSGcSessionCtx(void* p) {
7,590,265✔
96
  SGcSessionCtx* pSession = p;
7,590,265✔
97
  if (pSession->semInit) {
7,590,265✔
98
    if (tsem_destroy(&pSession->waitSem) < 0) {
×
99
      qError("tsem_destroy session waitSem failed, error:%s", tstrerror(terrno));
×
100
    }
101
  }
102
}
7,590,265✔
103

104
static void freeSGroupCacheFileInfo(void* p) {
142,603✔
105
  SGroupCacheFileInfo* pFileInfo = p;
142,603✔
106
  if (pFileInfo->deleted) {
142,603✔
107
    return;
×
108
  }
109

110
  removeGroupCacheFile(pFileInfo);
142,603✔
111
}
112

113
static void freeSGcFileCacheCtx(SGcFileCacheCtx* pFileCtx) {
4,787,632✔
114
  taosHashCleanup(pFileCtx->pCacheFile);
4,787,632✔
115
  pFileCtx->pCacheFile = NULL;
4,787,632✔
116
}
4,787,632✔
117

118
static void freeSGcVgroupCtx(void* p) {
2,393,816✔
119
  SGcVgroupCtx* pVgCtx = p;
2,393,816✔
120
  taosArrayDestroy(pVgCtx->pTbList);
2,393,816✔
121
  freeSGcFileCacheCtx(&pVgCtx->fileCtx);
2,393,816✔
122
}
2,393,816✔
123

124
static void freeGcBlockInList(void* p) {
3,703,138✔
125
  SSDataBlock** ppBlock = p;
3,703,138✔
126
  if (*ppBlock) {
3,703,138✔
127
    taosArrayDestroy((*ppBlock)->pDataBlock);
3,703,138✔
128
    taosMemoryFree(*ppBlock);
3,703,138✔
129
  }
130
}
3,703,138✔
131

132
static void freeSGcDownstreamCtx(SGcDownstreamCtx* pCtx) {
2,390,552✔
133
  taosArrayDestroy(pCtx->pNewGrpList);
2,390,552✔
134
  taosHashCleanup(pCtx->pGrpHash);
2,390,552✔
135
  tSimpleHashCleanup(pCtx->pVgTbHash);
2,390,552✔
136

137
  taosArrayDestroyEx(pCtx->pFreeBlock, freeGcBlockInList);
2,390,552✔
138
  taosHashCleanup(pCtx->pSessions);
2,390,552✔
139
  taosHashCleanup(pCtx->pWaitSessions);
2,390,552✔
140
  freeSGcFileCacheCtx(&pCtx->fileCtx);
2,390,552✔
141
}
2,390,552✔
142

143
static void destroyGroupCacheDownstreamCtx(SGroupCacheOperatorInfo* pGrpCacheOperator) {
1,195,276✔
144
  if (NULL == pGrpCacheOperator->pDownstreams) {
1,195,276✔
145
    return;
×
146
  }
147
  
148
  for (int32_t i = 0; i < pGrpCacheOperator->downstreamNum; ++i) {
3,585,828✔
149
    SGcDownstreamCtx* pCtx = &pGrpCacheOperator->pDownstreams[i];
2,390,552✔
150
    freeSGcDownstreamCtx(pCtx);
2,390,552✔
151
  }
152

153
  taosMemoryFree(pGrpCacheOperator->pDownstreams);
1,195,276✔
154
}
155

156

157
void blockDataDeepCleanup(SSDataBlock* pDataBlock) {
7,422,654✔
158
  size_t numOfCols = taosArrayGetSize(pDataBlock->pDataBlock);
7,422,654✔
159
  for (int32_t i = 0; i < numOfCols; ++i) {
28,263,027✔
160
    SColumnInfoData* p = taosArrayGet(pDataBlock->pDataBlock, i);
20,840,373✔
161
    if (NULL == p) {
20,840,373✔
162
      qError("fail to get %dth col in dataBlock, numOfCols:%d", i, (int32_t)numOfCols);
×
163
      continue;
×
164
    }
165
    taosMemoryFreeClear(p->pData);
20,840,373✔
166
    if (IS_VAR_DATA_TYPE(p->info.type)) {
20,840,373✔
167
      taosMemoryFreeClear(p->varmeta.offset);
196,566✔
168
      p->varmeta.length = 0;
196,566✔
169
      p->varmeta.allocLen = 0;
196,566✔
170
    } else {
171
      taosMemoryFreeClear(p->nullbitmap);
20,643,807✔
172
    }
173
  }
174
  pDataBlock->info.capacity = 0;
7,422,654✔
175
  pDataBlock->info.rows = 0;
7,422,654✔
176
}
7,422,654✔
177

178

179

180
static void destroySGcBlkCacheInfo(SGcBlkCacheInfo* pBlkCache) {
1,195,276✔
181
  taosHashCleanup(pBlkCache->pDirtyBlk);
1,195,276✔
182

183
  void* p = NULL;
1,195,276✔
184
  while (NULL != (p = taosHashIterate(pBlkCache->pReadBlk, p))) {
4,768,046✔
185
    blockDataDeepCleanup(*(SSDataBlock**)p);
3,572,770✔
186
    freeGcBlockInList(p);
3,572,770✔
187
  }
188

189
  taosHashCleanup(pBlkCache->pReadBlk);
1,195,276✔
190
}
1,195,276✔
191

192
static void destroyGroupCacheOperator(void* param) {
1,195,276✔
193
  SGroupCacheOperatorInfo* pGrpCacheOperator = (SGroupCacheOperatorInfo*)param;
1,195,276✔
194

195
  logGroupCacheExecInfo(pGrpCacheOperator);
1,195,276✔
196
  
197
  taosMemoryFree(pGrpCacheOperator->groupColsInfo.pColsInfo);
1,195,276✔
198
  taosMemoryFree(pGrpCacheOperator->groupColsInfo.pBuf);
1,195,276✔
199

200
  destroyGroupCacheDownstreamCtx(pGrpCacheOperator);
1,195,276✔
201
  destroySGcBlkCacheInfo(&pGrpCacheOperator->blkCache);
1,195,276✔
202
  taosHashCleanup(pGrpCacheOperator->pGrpHash);
1,195,276✔
203

204
  taosMemoryFree(pGrpCacheOperator->execInfo.pDownstreamBlkNum);
1,195,276✔
205
  
206
  taosMemoryFreeClear(param);
1,195,276✔
207
}
1,195,276✔
208

209
static FORCE_INLINE int32_t initOpenCacheFile(SGroupCacheFileFd* pFileFd, char* filename) {
210
  TdFilePtr newFd = taosOpenFile(filename, TD_FILE_CREATE|TD_FILE_READ|TD_FILE_WRITE|TD_FILE_AUTO_DEL);
142,603✔
211
  //TdFilePtr newFd = taosOpenFile(filename, TD_FILE_CREATE|TD_FILE_READ|TD_FILE_WRITE);
212
  if (NULL == newFd) {
142,603✔
213
    QRY_ERR_RET(terrno);
×
214
  }
215
  pFileFd->fd = newFd;
142,603✔
216
  int32_t code = taosThreadMutexInit(&pFileFd->mutex, NULL);
142,603✔
217
  if (code) {
142,603✔
218
    qError("taosThreadMutexInit failed, code:%x", code);
×
219
    QRY_ERR_RET(code);
×
220
  }
221

222
  qTrace("file path %s created", filename);
142,603✔
223
  
224
  return TSDB_CODE_SUCCESS;
142,603✔
225
}
226

227
static int32_t acquireFdFromFileCtx(SGcFileCacheCtx* pFileCtx, int32_t fileId, SGroupCacheFileFd** ppFd, bool* pDeleted) {
8,000,989✔
228
  int32_t code = TSDB_CODE_SUCCESS;
8,000,989✔
229
  if (NULL == pFileCtx->pCacheFile) {
8,000,989✔
230
    pFileCtx->pCacheFile = taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), false, HASH_ENTRY_LOCK);
142,603✔
231
    if (NULL == pFileCtx->pCacheFile) {
142,603✔
232
      return terrno;
×
233
    }
234
    taosHashSetFreeFp(pFileCtx->pCacheFile, freeSGroupCacheFileInfo);
142,603✔
235
  }
236
  
237
  SGroupCacheFileInfo* pTmp = taosHashGet(pFileCtx->pCacheFile, &fileId, sizeof(fileId));
8,000,989✔
238
  if (NULL == pTmp) {
8,000,989✔
239
    (void)snprintf(&pFileCtx->baseFilename[pFileCtx->baseNameLen], sizeof(pFileCtx->baseFilename) - pFileCtx->baseNameLen, "_%d", fileId);
142,603✔
240

241
    SGroupCacheFileInfo newFile = {0};
142,603✔
242
    if (taosHashPut(pFileCtx->pCacheFile, &fileId, sizeof(fileId), &newFile, sizeof(newFile))) {
142,603✔
243
      QRY_ERR_RET(terrno);
×
244
    }
245
    pTmp = taosHashGet(pFileCtx->pCacheFile, &fileId, sizeof(fileId));
142,603✔
246
    if (NULL == pTmp) {
142,603✔
247
      qError("fail to get file %d from pCacheFile", fileId);
×
248
      QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
249
    }
250
  }
251

252
  if (pTmp->deleted) {
8,000,989✔
253
    *pDeleted = true;
×
254
    return TSDB_CODE_SUCCESS;
×
255
  }
256

257
  if (NULL == pTmp->fd.fd) {
8,000,989✔
258
    code = initOpenCacheFile(&pTmp->fd, pFileCtx->baseFilename);
142,603✔
259
    if (code) {
142,603✔
260
      return code;
×
261
    }
262
  }
263

264
  (void)taosThreadMutexLock(&pTmp->fd.mutex);
8,000,989✔
265
  *ppFd = &pTmp->fd;
8,000,989✔
266
  
267
  return TSDB_CODE_SUCCESS;
8,000,989✔
268
}
269

270
static FORCE_INLINE void releaseFdToFileCtx(SGroupCacheFileFd* pFd) {
271
  if (NULL == pFd) {
8,000,989✔
272
    return;
×
273
  }
274
  (void)taosThreadMutexUnlock(&pFd->mutex);
8,000,989✔
275
}
276

277
static int32_t saveBlocksToDisk(SGroupCacheOperatorInfo* pGCache, SGcDownstreamCtx* pCtx, SGcBlkBufInfo* pHead) {
578,335✔
278
  int32_t code = TSDB_CODE_SUCCESS;
578,335✔
279
  SGroupCacheFileFd *pFd = NULL;
578,335✔
280
  SGcFileCacheCtx* pFileCtx = NULL;
578,335✔
281
  SHashObj* pGrpHash = pGCache->globalGrp ? pGCache->pGrpHash : pCtx->pGrpHash;
578,335✔
282
  int64_t lastGroupId = 0;
578,335✔
283
  SGroupCacheData* pGroup = NULL;
578,335✔
284
  
285
  while (NULL != pHead) {
1,156,670✔
286
    pFd = NULL;
578,335✔
287
    
288
    if (pGCache->batchFetch) {
578,335✔
289
      pFileCtx = &pHead->pCtx->fileCtx;
578,335✔
290
    } else {
291
      if (pHead->groupId != lastGroupId) {
×
292
        if (NULL != pGroup) {
×
293
          taosHashRelease(pGrpHash, pGroup);
×
294
        }
295
        pGroup = taosHashAcquire(pGrpHash, &pHead->groupId, sizeof(pHead->groupId));      
×
296
        lastGroupId = pHead->groupId;
×
297
      }
298
    
299
      if (NULL == pGroup) {
×
300
        qTrace("group %" PRIu64 " in downstream %d may already be deleted, skip write", pHead->groupId, pHead->pCtx->id);
×
301

302
        int64_t blkId = pHead->basic.blkId;
×
303
        pHead = pHead->next;
×
304
        code = taosHashRemove(pGCache->blkCache.pDirtyBlk, &blkId, sizeof(blkId));
×
305
        if (code) {
×
306
          qError("taosHashRemove blk %" PRId64 " from diryBlk failed, error:%s", blkId, tstrerror(code));
×
307
          goto _return;
×
308
        }
309
        continue;
×
310
      }
311
      
312
      pFileCtx = &pGroup->pVgCtx->fileCtx;
×
313
    }
314

315
    bool deleted = false;
578,335✔
316
    code = acquireFdFromFileCtx(pFileCtx, pHead->basic.fileId, &pFd, &deleted);
578,335✔
317
    if (code) {
578,335✔
318
      goto _return;
×
319
    }
320

321
    if (deleted) {
578,335✔
322
      releaseFdToFileCtx(pFd);
×
323

324
      qTrace("FileId:%d-%d-%d already be deleted, skip write", 
×
325
          pCtx->id, pGroup ? pGroup->vgId : GROUP_CACHE_DEFAULT_VGID, pHead->basic.fileId);
326
      
327
      int64_t blkId = pHead->basic.blkId;
×
328
      pHead = pHead->next;
×
329
      
330
      code = taosHashRemove(pGCache->blkCache.pDirtyBlk, &blkId, sizeof(blkId));
×
331
      if (code) {
×
332
        qError("taosHashRemove blk %" PRId64 " from diryBlk failed, error:%s", blkId, tstrerror(code));
×
333
        goto _return;
×
334
      }
335
      continue;
×
336
    }
337
    
338
    int64_t ret = taosLSeekFile(pFd->fd, pHead->basic.offset, SEEK_SET);
578,335✔
339
    if (ret < 0) {
578,335✔
340
      releaseFdToFileCtx(pFd);
×
341
      code = terrno;
×
342
      goto _return;
×
343
    }
344
    
345
    ret = taosWriteFile(pFd->fd, pHead->pBuf, pHead->basic.bufSize);
578,335✔
346
    if (ret != pHead->basic.bufSize) {
578,335✔
347
      releaseFdToFileCtx(pFd);
×
348
      code = terrno;
×
349
      goto _return;
×
350
    }
351
    
352
    releaseFdToFileCtx(pFd);
578,335✔
353

354
    qTrace("FileId:%d-%d-%d blk %" PRIu64 " in group %" PRIu64 " size %" PRIu64 " written to offset %" PRIu64, 
578,335✔
355
        pCtx->id, pGroup ? pGroup->vgId : GROUP_CACHE_DEFAULT_VGID, pHead->basic.fileId, pHead->basic.blkId, pHead->groupId, pHead->basic.bufSize, pHead->basic.offset);
356
    
357
    int64_t blkId = pHead->basic.blkId;
578,335✔
358
    pHead = pHead->next;
578,335✔
359

360
    code = taosHashRemove(pGCache->blkCache.pDirtyBlk, &blkId, sizeof(blkId));
578,335✔
361
    if (code) {
578,335✔
362
      qError("taosHashRemove blk %" PRId64 " from diryBlk failed, error:%s", blkId, tstrerror(code));
×
363
      goto _return;
×
364
    }
365
  }
366

367
_return:
578,335✔
368

369
  if (NULL != pGroup) {
578,335✔
370
    taosHashRelease(pGrpHash, pGroup);
×
371
  }
372

373
  (void)atomic_val_compare_exchange_32(&pGCache->blkCache.writeDownstreamId, pCtx->id, -1);
578,335✔
374

375
  return code;
578,335✔
376
}
377

378

379
void freeGcBlkBufInfo(void* ptr) {
578,335✔
380
  SGcBlkBufInfo* pBlk = (SGcBlkBufInfo*)ptr;
578,335✔
381
  taosMemoryFreeClear(pBlk->pBuf);
578,335✔
382
}
578,335✔
383

384

385
static int32_t addBlkToDirtyBufList(SGroupCacheOperatorInfo* pGCache, SGcDownstreamCtx* pCtx, SGcBlkCacheInfo* pCache, SGcBlkBufInfo* pBufInfo) {
578,335✔
386
  if (0 != taosHashPut(pCache->pDirtyBlk, &pBufInfo->basic.blkId, sizeof(pBufInfo->basic.blkId), pBufInfo, sizeof(*pBufInfo))) {
578,335✔
387
    freeGcBlkBufInfo(pBufInfo);
×
388
    return terrno;
×
389
  }
390
  pBufInfo = taosHashGet(pCache->pDirtyBlk, &pBufInfo->basic.blkId, sizeof(pBufInfo->basic.blkId));
578,335✔
391
  if (NULL == pBufInfo) {
578,335✔
392
    qError("fail to get blk %" PRId64 " from pCache->pDirtyBlk", pBufInfo->basic.blkId);
×
393
    QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
394
  }
395
  int32_t code = TSDB_CODE_SUCCESS;
578,335✔
396
  SGcBlkBufInfo* pWriteHead = NULL;
578,335✔
397
  
398
  taosWLockLatch(&pCache->dirtyLock);
578,335✔
399
  pCache->blkCacheSize += pBufInfo->basic.bufSize;
578,335✔
400
  qDebug("group cache total dirty block num:%d size:%" PRId64 , taosHashGetSize(pCache->pDirtyBlk), pCache->blkCacheSize);
578,335✔
401

402
  if (NULL == pCache->pDirtyHead) {
578,335✔
403
    pCache->pDirtyHead = pBufInfo;
578,335✔
404
  } else {
405
    pCache->pDirtyTail->next = pBufInfo;
×
406
  }
407
  pCache->pDirtyTail = pBufInfo;
578,335✔
408
    
409
  if (pGCache->maxCacheSize >= 0 && pCache->blkCacheSize > pGCache->maxCacheSize) {
578,335✔
410
    if (-1 == atomic_val_compare_exchange_32(&pCache->writeDownstreamId, -1, pCtx->id)) {
578,335✔
411
      pWriteHead = pCache->pDirtyHead;
578,335✔
412
      SGcBlkBufInfo* pTmp = pCache->pDirtyHead;
578,335✔
413
      while (NULL != pTmp) {
578,335✔
414
        pCache->blkCacheSize -= pTmp->basic.bufSize;
578,335✔
415
        if (pCache->blkCacheSize <= pGCache->maxCacheSize) {
578,335✔
416
          pCache->pDirtyHead = pTmp->next;
578,335✔
417
          pTmp->next = NULL;
578,335✔
418
          break;
578,335✔
419
        }
420
        pTmp = pTmp->next;
×
421
      }
422
    }
423
  }
424
  taosWUnLockLatch(&pCache->dirtyLock);
578,335✔
425

426
  if (NULL != pWriteHead) {
578,335✔
427
    code = saveBlocksToDisk(pGCache, pCtx, pWriteHead);
578,335✔
428
  }
429

430
  return code;
578,335✔
431
}
432

433
static FORCE_INLINE void chkRemoveVgroupCurrFile(SGcFileCacheCtx* pFileCtx, int32_t downstreamIdx, int32_t vgId) {
434
  SGroupCacheFileInfo* pFileInfo = taosHashGet(pFileCtx->pCacheFile, &pFileCtx->fileId, sizeof(pFileCtx->fileId));
×
435
  if (NULL == pFileInfo) {
×
436
    return;
×
437
  }
438
  
439
  if (0 == pFileInfo->groupNum) {
×
440
    removeGroupCacheFile(pFileInfo);
×
441

442
#if 0  
443
    /* debug only */
444
    snprintf(&pFileCtx->baseFilename[pFileCtx->baseNameLen], sizeof(pFileCtx->baseFilename) - pFileCtx->baseNameLen, "_%d", pFileCtx->fileId);
445
    taosRemoveFile(pFileCtx->baseFilename);
446
    /* debug only */
447
#endif
448

449
    qTrace("FileId:%d-%d-%d removed", downstreamIdx, vgId, pFileCtx->fileId);
×
450
    //taosHashRemove(pFileCtx->pCacheFile, &pGroup->fileId, sizeof(pGroup->fileId));
451
  }
452
}
453

454
static FORCE_INLINE void groupCacheSwitchNewFile(SGcFileCacheCtx* pFileCtx, int32_t downstreamIdx, int32_t vgId, bool removeCheck) {
455
  if (pFileCtx->fileSize < GROUP_CACHE_DEFAULT_MAX_FILE_SIZE) {
583,015✔
456
    return;
583,015✔
457
  }
458

459
  if (removeCheck) {
×
460
    chkRemoveVgroupCurrFile(pFileCtx, downstreamIdx, vgId);
461
  }
462
      
463
  pFileCtx->fileId++;
×
464
  pFileCtx->fileSize = 0;
×
465
}
466

467

468
static int32_t addBlkToBufCache(struct SOperatorInfo* pOperator, SSDataBlock* pBlock, SGcDownstreamCtx* pCtx, SGroupCacheData* pGroup, SGcBlkBufInfo* pBufInfo) {
578,335✔
469
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
578,335✔
470
  int64_t bufSize = blockDataGetSize(pBlock) + sizeof(int32_t) + taosArrayGetSize(pBlock->pDataBlock) * sizeof(int32_t);
578,335✔
471
  pBufInfo->pBuf = taosMemoryMalloc(bufSize);
578,335✔
472
  if (NULL == pBufInfo->pBuf) {
578,335✔
473
    qError("group cache add block to cache failed, size:%" PRId64, bufSize);
×
474
    return terrno;
×
475
  }
476
  QRY_ERR_RET(blockDataToBuf(pBufInfo->pBuf, pBlock));
578,335✔
477

478
  SGcFileCacheCtx* pFileCtx = pGCache->batchFetch ? &pCtx->fileCtx : &pGroup->pVgCtx->fileCtx;
578,335✔
479

480
  pBufInfo->next = NULL;
578,335✔
481
  pBufInfo->basic.blkId = atomic_add_fetch_64(&pGCache->currentBlkId, 1);
578,335✔
482
  pBufInfo->basic.fileId = pGCache->batchFetch ? pFileCtx->fileId : pGroup->fileId;
578,335✔
483
  pBufInfo->basic.bufSize = bufSize;
578,335✔
484
  pBufInfo->basic.offset = atomic_fetch_add_64(&pFileCtx->fileSize, bufSize);
578,335✔
485
  pBufInfo->pCtx = pCtx;
578,335✔
486
  pBufInfo->groupId = pBlock->info.id.groupId;
578,335✔
487

488
  if (pGCache->batchFetch) {    
578,335✔
489
    groupCacheSwitchNewFile(pFileCtx, pCtx->id, pGroup->vgId, false);
578,335✔
490
  }
491

492
  int32_t code = addBlkToDirtyBufList(pGCache, pCtx, &pGCache->blkCache, pBufInfo);
578,335✔
493

494
  return code;
578,335✔
495
}
496

497
void blockDataDeepClear(SSDataBlock* pDataBlock) {
3,703,138✔
498
  size_t numOfCols = taosArrayGetSize(pDataBlock->pDataBlock);
3,703,138✔
499
  for (int32_t i = 0; i < numOfCols; ++i) {
14,005,028✔
500
    SColumnInfoData* p = taosArrayGet(pDataBlock->pDataBlock, i);
10,301,890✔
501
    if (NULL == p) {
10,301,890✔
502
      qError("fail to get %d col from pDataBlock, numOfCols:%d", i, (int32_t)numOfCols);
×
503
      continue;
×
504
    }
505
    p->pData = NULL;
10,301,890✔
506
    if (IS_VAR_DATA_TYPE(p->info.type)) {
10,301,890✔
507
      p->varmeta.offset = NULL;
65,464✔
508
      p->varmeta.length = 0;
65,464✔
509
      p->varmeta.allocLen = 0;
65,464✔
510
    } else {
511
      p->nullbitmap = NULL;
10,236,426✔
512
    }
513
  }
514
  pDataBlock->info.capacity = 0;
3,703,138✔
515
  pDataBlock->info.rows = 0;
3,703,138✔
516
}
3,703,138✔
517

518
static int32_t buildGroupCacheBaseBlock(SSDataBlock** ppDst, SSDataBlock* pSrc) {
3,703,138✔
519
  *ppDst = taosMemoryMalloc(sizeof(*pSrc));
3,703,138✔
520
  if (NULL == *ppDst) {
3,703,138✔
521
    return terrno;
×
522
  }
523
  (*ppDst)->pBlockAgg = NULL;
3,703,138✔
524
  (*ppDst)->pDataBlock = taosArrayDup(pSrc->pDataBlock, NULL);
3,703,138✔
525
  if (NULL == (*ppDst)->pDataBlock) {
3,703,138✔
526
    taosMemoryFree(*ppDst);
×
527
    return terrno;
×
528
  }
529
  TAOS_MEMCPY(&(*ppDst)->info, &pSrc->info, sizeof(pSrc->info));
3,703,138✔
530
  blockDataDeepClear(*ppDst);
3,703,138✔
531
  
532
  return TSDB_CODE_SUCCESS;
3,703,138✔
533
}
534

535
static int32_t acquireBaseBlockFromList(SGcDownstreamCtx* pCtx, SSDataBlock** ppRes) {
7,422,654✔
536
  taosWLockLatch(&pCtx->blkLock);
7,422,654✔
537
  if (taosArrayGetSize(pCtx->pFreeBlock) <= 0) {
7,422,654✔
538
    taosWUnLockLatch(&pCtx->blkLock);
3,558,195✔
539
    return buildGroupCacheBaseBlock(ppRes, pCtx->pBaseBlock);
3,558,195✔
540
  }
541
  *ppRes = *(SSDataBlock**)taosArrayPop(pCtx->pFreeBlock);
3,864,459✔
542
  taosWUnLockLatch(&pCtx->blkLock);
3,864,459✔
543

544
  return TSDB_CODE_SUCCESS;  
3,864,459✔
545
}
546

547
static int32_t releaseBaseBlockToList(SGcDownstreamCtx* pCtx, SSDataBlock* pBlock) {
3,849,884✔
548
  int32_t code = TSDB_CODE_SUCCESS;
3,849,884✔
549
  
550
  blockDataDeepCleanup(pBlock);
3,849,884✔
551
  taosWLockLatch(&pCtx->blkLock);
3,849,884✔
552
  if (NULL == taosArrayPush(pCtx->pFreeBlock, &pBlock)) {
7,699,768✔
553
    code = terrno;
×
554
  }
555
  taosWUnLockLatch(&pCtx->blkLock);
3,849,884✔
556

557
  return code;
3,849,884✔
558
}
559

560

561
static int32_t buildGroupCacheResultBlock(SGroupCacheOperatorInfo* pGCache, int32_t downstreamIdx, void* pBuf, SSDataBlock** ppRes) {
7,422,654✔
562
  int32_t code = acquireBaseBlockFromList(&pGCache->pDownstreams[downstreamIdx], ppRes);
7,422,654✔
563
  if (code) {
7,422,654✔
564
    return code;
×
565
  }
566
  //TODO OPTIMIZE PERF
567
  return blockDataFromBuf(*ppRes, pBuf);
7,422,654✔
568
}
569

570
static int32_t readBlockFromDisk(SGroupCacheOperatorInfo* pGCache, SGroupCacheData* pGrp, SGcBlkBufBasic* pBasic, void** ppBuf) {
7,422,654✔
571
  SGroupCacheFileFd *pFileFd = NULL;
7,422,654✔
572
  SGcFileCacheCtx* pFileCtx = pGCache->batchFetch ? &pGCache->pDownstreams[pGrp->downstreamIdx].fileCtx : &pGrp->pVgCtx->fileCtx;
7,422,654✔
573
  bool deleted = false;
7,422,654✔
574
  int32_t code = acquireFdFromFileCtx(pFileCtx, pBasic->fileId, &pFileFd, &deleted);
7,422,654✔
575
  if (code) {
7,422,654✔
576
    return code;
×
577
  }
578
  if (deleted) {
7,422,654✔
579
    qError("FileId:%d-%d-%d already be deleted, skip read", pGrp->downstreamIdx, pGrp->vgId, pBasic->fileId);
×
580
    return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
581
  }
582
  
583
  int64_t ret = taosLSeekFile(pFileFd->fd, pBasic->offset, SEEK_SET);
7,422,654✔
584
  if (ret < 0) {
7,422,654✔
585
    code = terrno;
×
586
    goto _return;
×
587
  }
588

589
  *ppBuf = taosMemoryMalloc(pBasic->bufSize);
7,422,654✔
590
  if (NULL == *ppBuf) {
7,422,654✔
591
    code = terrno;
×
592
    goto _return;
×
593
  }
594
  
595
  ret = taosReadFile(pFileFd->fd, *ppBuf, pBasic->bufSize);
7,422,654✔
596
  if (ret != pBasic->bufSize) {
7,422,654✔
597
    taosMemoryFreeClear(*ppBuf);
×
598
    code = terrno;
×
599
    goto _return;
×
600
  }
601

602
  qTrace("FileId:%d-%d-%d blk %" PRIu64 " size %" PRIu64 " read from offset %" PRIu64, 
7,422,654✔
603
      pGrp->downstreamIdx, pGrp->vgId, pBasic->fileId, pBasic->blkId, pBasic->bufSize, pBasic->offset);
604

605
_return:
7,422,654✔
606

607
  releaseFdToFileCtx(pFileFd);
7,422,654✔
608
  return code;
7,422,654✔
609
}
610

611
static int32_t retrieveBlkFromBufCache(SGroupCacheOperatorInfo* pGCache, SGroupCacheData* pGrp, int64_t sessionId, SGcBlkBufBasic* pBasic, SSDataBlock** ppRes) {
7,422,654✔
612
  int32_t code = TSDB_CODE_SUCCESS;
7,422,654✔
613
  SGcBlkCacheInfo* pCache = &pGCache->blkCache;
7,422,654✔
614
  void* pBuf = NULL;
7,422,654✔
615

616
  SGcBlkBufInfo* pBufInfo = taosHashAcquire(pCache->pDirtyBlk, &pBasic->blkId, sizeof(pBasic->blkId));
7,422,654✔
617
  if (NULL == pBufInfo) {
7,422,654✔
618
    code = readBlockFromDisk(pGCache, pGrp, pBasic, &pBuf);
7,422,654✔
619
    if (code) {
7,422,654✔
620
      return code;
×
621
    }
622
  } else {
623
    pBuf = pBufInfo->pBuf;
×
624
  }
625
  
626
  code = buildGroupCacheResultBlock(pGCache, pGrp->downstreamIdx, pBuf, ppRes);
7,422,654✔
627
  taosHashRelease(pCache->pDirtyBlk, pBufInfo);
7,422,654✔
628
  if (NULL == pBufInfo) {
7,422,654✔
629
    taosMemoryFree(pBuf);
7,422,654✔
630
  }
631
  
632
  if (code) {
7,422,654✔
633
    return code;
×
634
  }
635

636
  QRY_ERR_RET(taosHashPut(pCache->pReadBlk, &sessionId, sizeof(sessionId), ppRes, POINTER_BYTES));
7,422,654✔
637
  
638
  return TSDB_CODE_SUCCESS;
7,422,654✔
639
}
640

641
static FORCE_INLINE void initGcVgroupCtx(SOperatorInfo* pOperator, SGcVgroupCtx* pVgCtx, int32_t downstreamId, int32_t vgId, SArray* pTbList) {
642
  pVgCtx->pTbList = pTbList;
2,393,816✔
643
  pVgCtx->id = vgId;
2,393,816✔
644
  (void)snprintf(pVgCtx->fileCtx.baseFilename, sizeof(pVgCtx->fileCtx.baseFilename) - 1, "%s/gc_%d_%" PRIx64 "_%" PRIu64 "_%p_%d_%d", 
4,787,632✔
645
     tsTempDir, taosGetPId(), pOperator->pTaskInfo->id.queryId, pOperator->pTaskInfo->id.taskId, pOperator, downstreamId, vgId);
4,787,632✔
646
  pVgCtx->fileCtx.baseFilename[sizeof(pVgCtx->fileCtx.baseFilename) - 1] = 0;
2,393,816✔
647

648
  pVgCtx->fileCtx.baseNameLen = strlen(pVgCtx->fileCtx.baseFilename);
2,393,816✔
649
}
2,393,816✔
650

651
static int32_t addNewGroupToVgHash(SOperatorInfo* pOperator, SSHashObj* pHash, SGcNewGroupInfo* pNew) {
4,680✔
652
  SGcVgroupCtx* pVgCtx = pNew->pGroup->pVgCtx;
4,680✔
653
  if (NULL == pVgCtx) {
4,680✔
654
    SArray* pList = taosArrayInit(10, sizeof(*pNew));
2,340✔
655
    if (NULL == pList) {
2,340✔
656
      return terrno;
×
657
    }
658
    if (NULL == taosArrayPush(pList, pNew)) {
2,340✔
659
      QRY_ERR_RET(terrno);
×
660
    }
661
    
662
    SGcVgroupCtx vgCtx = {0};
2,340✔
663
    initGcVgroupCtx(pOperator, &vgCtx, pNew->pGroup->downstreamIdx, pNew->vgId, pList);
2,340✔
664
    QRY_ERR_RET(tSimpleHashPut(pHash, &pNew->vgId, sizeof(pNew->vgId), &vgCtx, sizeof(vgCtx)));
2,340✔
665
    
666
    pNew->pGroup->pVgCtx = tSimpleHashGet(pHash, &pNew->vgId, sizeof(pNew->vgId));
2,340✔
667
    if (NULL == pNew->pGroup->pVgCtx) {
2,340✔
668
      qError("fail to get vg %d ctx from vgHash", pNew->vgId);
×
669
      QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
670
    }
671
    
672
    return TSDB_CODE_SUCCESS;
2,340✔
673
  }
674

675
  if (NULL == taosArrayPush(pVgCtx->pTbList, pNew)) {
4,680✔
676
    QRY_ERR_RET(terrno);
×
677
  }
678
  
679
  return TSDB_CODE_SUCCESS;
2,340✔
680
}
681

682
static FORCE_INLINE int32_t appendNewGroupToDownstream(struct SOperatorInfo* pOperator, int32_t downstreamIdx, SOperatorParam** ppParam) {
683
  int32_t code = TSDB_CODE_SUCCESS;
714,650✔
684
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
714,650✔
685
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[downstreamIdx];  
714,650✔
686
  SOperatorParam* pDst = NULL;
714,650✔
687
  
688
  taosWLockLatch(&pCtx->grpLock);
714,650✔
689
  int32_t num = taosArrayGetSize(pCtx->pNewGrpList);
714,650✔
690
  if (num <= 0) {
714,650✔
691
    goto _return;
560,520✔
692
  }
693

694
  for (int32_t i = 0; i < num; ++i) {
308,260✔
695
    SGcNewGroupInfo* pNew = taosArrayGet(pCtx->pNewGrpList, i);
154,130✔
696
    if (NULL == pNew) {
154,130✔
697
      qError("fail to get vg %d SGcNewGroupInfo from pNewGrpList", i);
×
698
      QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
699
    }
700
    
701
    if (!pGCache->batchFetch) {
154,130✔
702
      code = addNewGroupToVgHash(pOperator, pCtx->pVgTbHash, pNew);
4,680✔
703
      if (code) {
4,680✔
704
        goto _return;
×
705
      }
706
    }
707

708
    if (NULL == pDst) {
154,130✔
709
      pDst = pNew->pParam;
154,130✔
710
    } else if (pNew->pParam) {
×
711
      code = mergeOperatorParams(pDst, pNew->pParam);
×
712
      if (code) {
×
713
        goto _return;
×
714
      }
715
    }
716
  }
717

718
  taosArrayClear(pCtx->pNewGrpList);
154,130✔
719
  
720
_return:
714,650✔
721

722
  taosWUnLockLatch(&pCtx->grpLock);
714,650✔
723
  *ppParam = pDst;
714,650✔
724
  
725
  return code;
714,650✔
726
}
727

728
static FORCE_INLINE int32_t getBlkFromDownstreamOperator(struct SOperatorInfo* pOperator, int32_t downstreamIdx,
729
                                                         SSDataBlock** ppRes) {
730
  int32_t                  code = TSDB_CODE_SUCCESS;
714,650✔
731
  SOperatorParam*          pDownstreamParam = NULL;
1,429,300✔
732
  SSDataBlock*             pBlock = NULL;
714,650✔
733
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
714,650✔
734

735
  code = appendNewGroupToDownstream(pOperator, downstreamIdx, &pDownstreamParam);
714,650✔
736
  if (code) {
714,650✔
737
    return code;
×
738
  }
739

740
  SOperatorInfo* pDownstream = pOperator->pDownstream[downstreamIdx];
714,650✔
741
  if (pDownstreamParam) {
714,650✔
742
    code = pDownstream->fpSet.getNextExtFn(pDownstream, pDownstreamParam, &pBlock);
154,130✔
743
  } else {
744
    code = pDownstream->fpSet.getNextFn(pDownstream, &pBlock);
560,520✔
745
  }
746

747
  if (code) {
714,650✔
748
    qError("failed to get block from downstream, code:%s %s", tstrerror(code), GET_TASKID(pOperator->pTaskInfo));
×
749
    return code;
×
750
  }
751

752
  if (pBlock) {
714,650✔
753
    qDebug("%s res block retrieved from group %" PRIu64, GET_TASKID(pOperator->pTaskInfo), pBlock->info.id.groupId);
583,015✔
754

755
    pGCache->execInfo.pDownstreamBlkNum[downstreamIdx]++;
583,015✔
756
    if (NULL == pGCache->pDownstreams[downstreamIdx].pBaseBlock) {
583,015✔
757
      code = buildGroupCacheBaseBlock(&pGCache->pDownstreams[downstreamIdx].pBaseBlock, pBlock);
144,943✔
758
      if (code) {
144,943✔
759
        return code;
×
760
      }
761

762
      if (NULL == taosArrayPush(pGCache->pDownstreams[downstreamIdx].pFreeBlock,
289,886✔
763
                                &pGCache->pDownstreams[downstreamIdx].pBaseBlock)) {
144,943✔
764
        QRY_ERR_RET(terrno);
×
765
      }
766
    }
767
  }
768

769
  code = blockDataCheck(pBlock);
714,650✔
770

771
  *ppRes = pBlock;
714,650✔
772
  return code;
714,650✔
773
}
774

775
static int32_t notifyWaitingSessions(SArray* pWaitQueue) {
1,118,246✔
776
  if (NULL == pWaitQueue || taosArrayGetSize(pWaitQueue) <= 0) {
1,118,246✔
777
    return TSDB_CODE_SUCCESS;
1,118,246✔
778
  }
779
  
780
  int32_t n = taosArrayGetSize(pWaitQueue);
×
781
  for (int32_t i = 0; i < n; ++i) {
×
782
    SGcSessionCtx* pSession = taosArrayGetP(pWaitQueue, i);
×
783
    if (NULL == pSession) {
×
784
      qError("fail to get %d SGcSessionCtx in pWaitQueue, total:%d", i, n);
×
785
      QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
786
    }
787
    
788
    QRY_ERR_RET(tsem_post(&pSession->waitSem));
×
789
  }
790

791
  return TSDB_CODE_SUCCESS;
×
792
}
793

794
static FORCE_INLINE int32_t handleGroupFetchDone(SGroupCacheData* pGroup) {
795
  int32_t code = TSDB_CODE_SUCCESS;
535,231✔
796
  pGroup->pBlock = NULL;
535,231✔
797
  atomic_store_8((int8_t*)&pGroup->fetchDone, true);
535,231✔
798
  
799
  (void)taosThreadMutexLock(&pGroup->mutex);
535,231✔
800
  code = notifyWaitingSessions(pGroup->waitQueue);
535,231✔
801
  taosArrayClear(pGroup->waitQueue);
535,231✔
802
  (void)taosThreadMutexUnlock(&pGroup->mutex);
535,231✔
803

804
  return code;
535,231✔
805
}
806

807
static int32_t addFileRefTableNum(SGcFileCacheCtx* pFileCtx, int32_t fileId, int32_t downstreamId, int32_t vgId) {
×
808
  if (NULL == pFileCtx->pCacheFile) {
×
809
    pFileCtx->pCacheFile = taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT), false, HASH_ENTRY_LOCK);
×
810
    if (NULL == pFileCtx->pCacheFile) {
×
811
      return terrno;
×
812
    }
813
    taosHashSetFreeFp(pFileCtx->pCacheFile, freeSGroupCacheFileInfo);
×
814
  }
815
  
816
  SGroupCacheFileInfo* pTmp = taosHashGet(pFileCtx->pCacheFile, &fileId, sizeof(fileId));
×
817
  if (NULL == pTmp) {
×
818
    (void)snprintf(&pFileCtx->baseFilename[pFileCtx->baseNameLen], sizeof(pFileCtx->baseFilename) - pFileCtx->baseNameLen, "_%u", fileId);
×
819

820
    SGroupCacheFileInfo newFile = {0};
×
821
    newFile.groupNum = 1;
×
822
    QRY_ERR_RET(taosHashPut(pFileCtx->pCacheFile, &fileId, sizeof(fileId), &newFile, sizeof(newFile)));
×
823
    pTmp = taosHashGet(pFileCtx->pCacheFile, &fileId, sizeof(fileId));
×
824
    if (NULL == pTmp) {
×
825
      qError("fail to get file %d in pCacheFile", fileId);
×
826
      QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
827
    }
828
  } else {
829
    pTmp->groupNum++;
×
830
  }
831

832
  qTrace("FileId:%d-%d-%d add groupNum to %u", downstreamId, vgId, fileId, pTmp->groupNum);
×
833

834
  return TSDB_CODE_SUCCESS;
×
835
}
836

837
static int32_t handleVgroupTableFetchDone(SGcDownstreamCtx* pCtx, SGroupCacheData* pGroup, uint64_t uid) {
4,680✔
838
  if (pCtx->lastBlkUid == uid || pGroup->pVgCtx->lastBlkUid == uid) {
4,680✔
839
    return TSDB_CODE_SUCCESS;
×
840
  }
841
  
842
  pCtx->lastBlkUid = uid;
4,680✔
843
  pGroup->pVgCtx->lastBlkUid = uid;
4,680✔
844
  
845
  int32_t i = 0;
4,680✔
846
  while (true) {
×
847
    SGcNewGroupInfo* pNew = taosArrayGet(pGroup->pVgCtx->pTbList, i++);
4,680✔
848
    if (NULL == pNew || pNew->uid == uid) {
4,680✔
849
      break;
850
    }
851
    QRY_ERR_RET(handleGroupFetchDone(pNew->pGroup));
×
852
  }
853

854
  groupCacheSwitchNewFile(&pGroup->pVgCtx->fileCtx, pGroup->downstreamIdx, pGroup->vgId, true);
4,680✔
855

856
  pGroup->fileId = pGroup->pVgCtx->fileCtx.fileId;
4,680✔
857
  pGroup->startOffset = pGroup->pVgCtx->fileCtx.fileSize;
4,680✔
858

859
  qTrace("FileId:%d-%d-%d add groupNum for group %" PRIu64, pGroup->downstreamIdx, pGroup->vgId, pGroup->pVgCtx->fileCtx.fileId, uid);
4,680✔
860

861
  if (pGroup->needCache) {
4,680✔
862
    return addFileRefTableNum(&pGroup->pVgCtx->fileCtx, pGroup->pVgCtx->fileCtx.fileId, pGroup->downstreamIdx, pGroup->vgId);
×
863
  }
864

865
  return TSDB_CODE_SUCCESS;
4,680✔
866
}
867

868

869
static FORCE_INLINE int32_t initNewGroupData(SGcDownstreamCtx* pCtx, SGroupCacheData* pGroup, int32_t downstreamIdx, int32_t vgId, bool batchFetch, bool needCache) {
870
  QRY_ERR_RET(taosThreadMutexInit(&pGroup->mutex, NULL));
591,289✔
871
  
872
  pGroup->downstreamIdx = downstreamIdx;
591,289✔
873
  pGroup->vgId = vgId;
591,289✔
874
  pGroup->fileId = -1;
591,289✔
875
  pGroup->blkList.pList = taosArrayInit(10, sizeof(SGcBlkBufBasic));
591,289✔
876
  if (NULL == pGroup->blkList.pList) {
591,289✔
877
    QRY_ERR_RET(terrno);
×
878
  }
879
  pGroup->startOffset = -1;
591,289✔
880
  pGroup->needCache = needCache;
591,289✔
881
  pGroup->pVgCtx = tSimpleHashGet(pCtx->pVgTbHash, &pGroup->vgId, sizeof(pGroup->vgId));
591,289✔
882

883
  return TSDB_CODE_SUCCESS;
591,289✔
884
}
885

886
static int32_t addNewGroupData(struct SOperatorInfo* pOperator, SOperatorParam* pParam, SGroupCacheData** ppGrp, int32_t vgId, int64_t uid) {
591,289✔
887
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
591,289✔
888
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pParam->downstreamIdx];
591,289✔
889
  SGcOperatorParam* pGcParam = pParam->value;  
591,289✔
890
  SHashObj* pGrpHash = pGCache->globalGrp ? pGCache->pGrpHash : pCtx->pGrpHash;
591,289✔
891
  SGroupCacheData grpData = {0};
591,289✔
892
  
893
  while (true) {
894
    if (0 != taosHashPut(pGrpHash, &uid, sizeof(uid), &grpData, sizeof(grpData))) {
591,289✔
895
      if (terrno == TSDB_CODE_DUP_KEY) {
×
896
        *ppGrp = taosHashGet(pGrpHash, &uid, sizeof(uid));
×
897
        if (*ppGrp) {
×
898
          break;
×
899
        }
900
      } else {
901
        return terrno;
×
902
      }
903
    }
904

905
    break;
591,289✔
906
  }
907

908
  *ppGrp = taosHashGet(pGrpHash, &uid, sizeof(uid));
591,289✔
909
  if (NULL == *ppGrp) {
591,289✔
910
    return terrno;
×
911
  }
912
  QRY_ERR_RET(initNewGroupData(pCtx, *ppGrp, pParam->downstreamIdx, vgId, pGCache->batchFetch, pGcParam->needCache));
1,182,578✔
913

914
  qDebug("new group %" PRIu64 " initialized, downstreamIdx:%d, vgId:%d, needCache:%d", uid, pParam->downstreamIdx, vgId, pGcParam->needCache);
591,289✔
915

916
  if (pParam->pChildren) {
591,289✔
917
    SGcNewGroupInfo newGroup;
154,130✔
918
    newGroup.pGroup = *ppGrp;
154,130✔
919
    newGroup.vgId = vgId;
154,130✔
920
    newGroup.uid = uid;
154,130✔
921
    newGroup.pParam = taosArrayGetP(pParam->pChildren, 0);
154,130✔
922
    
923
    taosWLockLatch(&pCtx->grpLock);
154,130✔
924
    if (NULL == taosArrayPush(pCtx->pNewGrpList, &newGroup)) {
308,260✔
925
      taosWUnLockLatch(&pCtx->grpLock);
×
926
      return terrno;
×
927
    }
928
    taosWUnLockLatch(&pCtx->grpLock);
154,130✔
929
    
930
    taosArrayDestroy(pParam->pChildren);
154,130✔
931
    pParam->pChildren = NULL;
154,130✔
932
    pCtx->fetchDone = false;
154,130✔
933
  }
934

935
  return TSDB_CODE_SUCCESS;
591,289✔
936
}
937

938
static int32_t addBlkToGroupCache(bool batchFetch, SGroupCacheData* pGroup, SGcBlkBufInfo* pNewBlk, int64_t* pIdx) {
578,335✔
939
  taosWLockLatch(&pGroup->blkList.lock);
578,335✔
940
  if (NULL == taosArrayPush(pGroup->blkList.pList, &pNewBlk->basic)) {
1,156,670✔
941
    QRY_ERR_RET(terrno);
×
942
  }
943
  *pIdx = taosArrayGetSize(pGroup->blkList.pList) - 1;
578,335✔
944
  taosWUnLockLatch(&pGroup->blkList.lock);
578,335✔
945

946
  qDebug("block added to group cache, total block num:%" PRId64, *pIdx + 1);
578,335✔
947
  
948
  return TSDB_CODE_SUCCESS;
578,335✔
949
}
950

951
static int32_t handleGroupCacheRetrievedBlk(struct SOperatorInfo* pOperator, SSDataBlock* pBlock, SGcSessionCtx* pSession, bool* continueFetch) {
583,015✔
952
  int32_t code = TSDB_CODE_SUCCESS;
583,015✔
953
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
583,015✔
954
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pSession->downstreamIdx];
583,015✔
955
  SHashObj* pGrpHash = pGCache->globalGrp ? pGCache->pGrpHash : pCtx->pGrpHash;
583,015✔
956
  int64_t newBlkIdx = 0;
583,015✔
957

958
  SGroupCacheData* pGroup = taosHashGet(pGrpHash, &pBlock->info.id.groupId, sizeof(pBlock->info.id.groupId));
583,015✔
959
  if (NULL == pGroup) {
583,015✔
960
    if (pGCache->batchFetch) {
423,678✔
961
      SGcOperatorParam fakeGcParam = {0};
423,678✔
962
      SOperatorParam fakeParam = {0};
423,678✔
963
      fakeGcParam.needCache = true;
423,678✔
964
      fakeParam.downstreamIdx = pSession->downstreamIdx;
423,678✔
965
      fakeParam.value = &fakeGcParam;
423,678✔
966
      fakeParam.reUse = false;
423,678✔
967
      code = addNewGroupData(pOperator, &fakeParam, &pGroup, GROUP_CACHE_DEFAULT_VGID, pBlock->info.id.groupId);
423,678✔
968
      if (TSDB_CODE_SUCCESS != code) {
423,678✔
969
        return code;
×
970
      }
971
    } else {
972
      qError("group %" PRIu64 " not found in group hash", pBlock->info.id.groupId);
×
973
      return TSDB_CODE_INVALID_PARA;
×
974
    }
975
  }
976

977
  if (!pGCache->batchFetch) {
583,015✔
978
    code = handleVgroupTableFetchDone(pCtx, pGroup, pBlock->info.id.groupId);
4,680✔
979
    if (TSDB_CODE_SUCCESS != code) {
4,680✔
980
      return code;
×
981
    }
982
  }
983

984
  if (pGroup->needCache) {
583,015✔
985
    qDebug("add block to group cache");
578,335✔
986
    
987
    SGcBlkBufInfo newBlkBuf;    
578,335✔
988
    code = addBlkToBufCache(pOperator, pBlock, pCtx, pGroup, &newBlkBuf);
578,335✔
989
    if (code) {
578,335✔
990
      return code;
×
991
    }
992

993
    code = addBlkToGroupCache(pGCache->batchFetch, pGroup, &newBlkBuf, &newBlkIdx);
578,335✔
994
    if (code) {
578,335✔
995
      return code;
×
996
    }
997
  } else {
998
    qDebug("no need to add block to group cache");
4,680✔
999
    
1000
    pGroup->pBlock = pBlock;
4,680✔
1001
  }
1002

1003
  QRY_ERR_RET(notifyWaitingSessions(pGroup->waitQueue));
583,015✔
1004
  if (pGroup == pSession->pGroupData) {
583,015✔
1005
    if (pGroup->needCache) {
159,337✔
1006
      pSession->lastBlkId = newBlkIdx;
154,657✔
1007
    }
1008
    
1009
    *continueFetch = false;
159,337✔
1010
  }
1011

1012
  return TSDB_CODE_SUCCESS;
583,015✔
1013
}
1014

1015
static int32_t handleDownstreamFetchDone(struct SOperatorInfo* pOperator, SGcSessionCtx* pSession) {
131,635✔
1016
  int32_t code = TSDB_CODE_SUCCESS;
131,635✔
1017
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
131,635✔
1018
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pSession->downstreamIdx];  
131,635✔
1019
  if (pGCache->batchFetch) {
131,635✔
1020
    SHashObj* pGrpHash = pGCache->globalGrp ? pGCache->pGrpHash : pCtx->pGrpHash;
126,955✔
1021
    SGroupCacheData* pGroup = NULL;
126,955✔
1022
    while (NULL != (pGroup = taosHashIterate(pGrpHash, pGroup))) {
657,506✔
1023
      QRY_ERR_RET(handleGroupFetchDone(pGroup));
530,551✔
1024
    }
1025
    pCtx->fetchDone = true;
126,955✔
1026
  } else {
1027
    int32_t uidNum = 0;
4,680✔
1028
    SGcVgroupCtx* pVgCtx = NULL;
4,680✔
1029
    int32_t iter = 0;
4,680✔
1030
    while (NULL != (pVgCtx = tSimpleHashIterate(pCtx->pVgTbHash, pVgCtx, &iter))) {
9,360✔
1031
      uidNum = taosArrayGetSize(pVgCtx->pTbList);
4,680✔
1032
      for (int32_t i = 0; i < uidNum; ++i) {
9,360✔
1033
        SGcNewGroupInfo* pNew = taosArrayGet(pVgCtx->pTbList, i);
4,680✔
1034
        QRY_ERR_RET(handleGroupFetchDone(pNew->pGroup));
9,360✔
1035
      }
1036
      taosArrayClear(pVgCtx->pTbList);
4,680✔
1037
    }    
1038
  }
1039

1040
  taosHashClear(pCtx->pWaitSessions);
131,635✔
1041

1042
  return TSDB_CODE_SUCCESS;
131,635✔
1043
}
1044

1045
static int32_t getCacheBlkFromDownstreamOperator(struct SOperatorInfo* pOperator, SGcDownstreamCtx* pCtx, int64_t sessionId, SGcSessionCtx* pSession, SSDataBlock** ppRes) {
290,972✔
1046
  bool continueFetch = true;
290,972✔
1047
  int32_t code = TSDB_CODE_SUCCESS;
290,972✔
1048
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
290,972✔
1049

1050
  while (continueFetch && TSDB_CODE_SUCCESS == code) {
873,987✔
1051
    QRY_ERR_RET(getBlkFromDownstreamOperator(pOperator, pSession->downstreamIdx, ppRes));
1,429,300✔
1052
    
1053
    if (NULL == *ppRes) {
714,650✔
1054
      QRY_ERR_RET(handleDownstreamFetchDone(pOperator, pSession));
131,635✔
1055
      break;
131,635✔
1056
    } else {
1057
      QRY_ERR_RET(handleGroupCacheRetrievedBlk(pOperator, *ppRes, pSession, &continueFetch));
583,015✔
1058
    }
1059
  }
1060

1061
  if (!continueFetch) {
290,972✔
1062
    SGcSessionCtx** ppWaitCtx = taosHashIterate(pCtx->pWaitSessions, NULL);
159,337✔
1063
    if (ppWaitCtx) {
159,337✔
1064
      taosHashCancelIterate(pCtx->pWaitSessions, ppWaitCtx);
×
1065
      int64_t* pSessionId = taosHashGetKey(ppWaitCtx, NULL);
×
1066
      if (sessionId != atomic_val_compare_exchange_64(&pCtx->fetchSessionId, sessionId, *pSessionId)) {
×
1067
        qError("wrong fetch sessionId: %" PRIu64 " expected: %" PRIu64 , pCtx->fetchSessionId, sessionId);
×
1068
        return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
1069
      }
1070
      SGcSessionCtx* pWaitCtx = *ppWaitCtx;
×
1071
      pWaitCtx->newFetch = true;
×
1072
      code = taosHashRemove(pCtx->pWaitSessions, pSessionId, sizeof(*pSessionId));
×
1073
      if (code) {
×
1074
        qError("taosHashRemove session %" PRId64 " from waitSession failed, error: %s", *pSessionId, tstrerror(code));
×
1075
        return code;
×
1076
      }
1077
      QRY_ERR_RET(tsem_post(&pWaitCtx->waitSem));
×
1078

1079
      return code;
×
1080
    }
1081
  }
1082

1083
  if (sessionId != atomic_val_compare_exchange_64(&pCtx->fetchSessionId, sessionId, -1)) {
290,972✔
1084
    qError("wrong fetch sessionId: %" PRIu64 " expected: %" PRIu64 , pCtx->fetchSessionId, sessionId);
×
1085
    return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
1086
  }
1087
  
1088
  return code;
290,972✔
1089
}
1090

1091
static int32_t getBlkFromSessionCacheImpl(struct SOperatorInfo* pOperator, int64_t sessionId, SGcSessionCtx* pSession, SSDataBlock** ppRes, bool* got) {
11,566,730✔
1092
  int32_t code = TSDB_CODE_SUCCESS;
11,566,730✔
1093
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
11,566,730✔
1094
  *got = true;
11,566,730✔
1095

1096
  if (NULL != pSession->pGroupData) {
11,566,730✔
1097
    if (pSession->pGroupData->needCache) {
11,566,730✔
1098
      SGcBlkList* pBlkList = &pSession->pGroupData->blkList;
11,552,690✔
1099
      taosRLockLatch(&pBlkList->lock);
11,552,690✔
1100
      int64_t blkNum = taosArrayGetSize(pBlkList->pList);
11,552,690✔
1101
      if (pSession->lastBlkId < 0) {
11,552,690✔
1102
        if (blkNum > 0) {
7,585,585✔
1103
          SGcBlkBufBasic* pBasic = taosArrayGet(pBlkList->pList, 0);
7,422,654✔
1104
          taosRUnLockLatch(&pBlkList->lock);
7,422,654✔
1105
          code = retrieveBlkFromBufCache(pGCache, pSession->pGroupData, sessionId, pBasic, ppRes);
7,422,654✔
1106
          pSession->lastBlkId = 0;
7,422,654✔
1107
          return code;
7,422,654✔
1108
        }
1109
      } else if ((pSession->lastBlkId + 1) < blkNum) {
3,967,105✔
1110
        SGcBlkBufBasic* pBasic = taosArrayGet(pBlkList->pList, pSession->lastBlkId + 1);
×
1111
        taosRUnLockLatch(&pBlkList->lock);
×
1112
        code = retrieveBlkFromBufCache(pGCache, pSession->pGroupData, sessionId, pBasic, ppRes);
×
1113
        pSession->lastBlkId++;
×
1114
        return code;
×
1115
      }
1116
      taosRUnLockLatch(&pBlkList->lock);
4,130,036✔
1117
    } else if (pSession->pGroupData->pBlock) {
14,040✔
1118
      *ppRes = pSession->pGroupData->pBlock;
4,680✔
1119
      pSession->pGroupData->pBlock = NULL;
4,680✔
1120
      return TSDB_CODE_SUCCESS;
4,680✔
1121
    }
1122

1123
    if (atomic_load_8((int8_t*)&pSession->pGroupData->fetchDone)) {
4,139,396✔
1124
      *ppRes = NULL;
3,848,424✔
1125
      qDebug("sessionId: %" PRIu64 " fetch done", sessionId);
3,848,424✔
1126
      return code;
3,848,424✔
1127
    }
1128
  } else {
1129
    *ppRes = NULL;
×
1130
    qDebug("sessionId: %" PRIu64 " fetch done since downstream fetch done", sessionId);
×
1131
    return code;
×
1132
  }
1133

1134
  *got = false;
290,972✔
1135
  return code;
290,972✔
1136
}
1137

1138

1139
static int32_t groupCacheSessionWait(struct SOperatorInfo* pOperator, SGcDownstreamCtx* pCtx, int64_t sessionId, SGcSessionCtx* pSession, SSDataBlock** ppRes) {
×
1140
  // FOR NOW, IT'S ERROR TO REACH HERE
1141
#if 1
1142
  qError("should not enter session wait");
×
1143
  return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
1144
#else
1145
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
1146
  SGroupCacheData* pGroup = pSession->pGroupData;
1147
  int32_t code = TSDB_CODE_SUCCESS;
1148
  bool inLock = true;
1149
  if (NULL == pGroup->waitQueue) {
1150
    pGroup->waitQueue = taosArrayInit(1, POINTER_BYTES);
1151
    if (NULL == pGroup->waitQueue) {
1152
      QRY_ERR_JRET(terrno);
1153
    }
1154
  }
1155
  
1156
  if (NULL == taosArrayPush(pGroup->waitQueue, &pSession)) {
1157
    QRY_ERR_JRET(terrno);
1158
  }
1159

1160
  if (!pSession->semInit) {
1161
    QRY_ERR_JRET(tsem_init(&pSession->waitSem, 0, 0));
1162
    pSession->semInit = true;
1163
  }
1164

1165
  (void)taosThreadMutexUnlock(&pSession->pGroupData->mutex);
1166
  inLock = false;
1167

1168
  QRY_ERR_JRET(taosHashPut(pCtx->pWaitSessions, &sessionId, sizeof(sessionId), &pSession, POINTER_BYTES));
1169

1170
  code = tsem_wait(&pSession->waitSem);
1171
  if (code) {
1172
    qError("tsem_wait failed, error:%s", tstrerror(code));
1173
    QRY_ERR_JRET(code);
1174
  }
1175

1176
  if (pSession->newFetch) {
1177
    pSession->newFetch = false;
1178
    return getCacheBlkFromDownstreamOperator(pOperator, pCtx, sessionId, pSession, ppRes);
1179
  }
1180

1181
  code = taosHashRemove(pCtx->pWaitSessions, &sessionId, sizeof(sessionId));
1182
  if (code) {
1183
    qError("taosHashRemove session %" PRId64 " from waitSession failed, error: %s", sessionId, tstrerror(code));
1184
    QRY_ERR_JRET(code);
1185
  }
1186

1187
  bool got = false;
1188
  return getBlkFromSessionCacheImpl(pOperator, sessionId, pSession, ppRes, &got);
1189

1190
_return:
1191

1192
  if (inLock) {
1193
    (void)taosThreadMutexUnlock(&pSession->pGroupData->mutex);
1194
  }
1195

1196
  return code;
1197
#endif
1198
}
1199

1200

1201
static int32_t getBlkFromSessionCache(struct SOperatorInfo* pOperator, int64_t sessionId, SGcSessionCtx* pSession, SSDataBlock** ppRes) {
11,566,730✔
1202
  int32_t code = TSDB_CODE_SUCCESS;
11,566,730✔
1203
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
11,566,730✔
1204
  bool locked = false;
11,566,730✔
1205
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pSession->downstreamIdx];
11,566,730✔
1206
  
1207
  while (true) {
×
1208
    bool got = false;
11,566,730✔
1209
    code = getBlkFromSessionCacheImpl(pOperator, sessionId, pSession, ppRes, &got);
11,566,730✔
1210
    if (TSDB_CODE_SUCCESS != code || got) {
11,566,730✔
1211
      goto _return;
11,275,758✔
1212
    }
1213
    
1214
    if ((atomic_load_64(&pCtx->fetchSessionId) == sessionId)
290,972✔
1215
      || (-1 == atomic_val_compare_exchange_64(&pCtx->fetchSessionId, -1, sessionId))) {
290,972✔
1216
      if (locked) {
290,972✔
1217
        (void)taosThreadMutexUnlock(&pSession->pGroupData->mutex);
×
1218
        locked = false;
×
1219
      }
1220
      
1221
      code = getCacheBlkFromDownstreamOperator(pOperator, pCtx, sessionId, pSession, ppRes);
290,972✔
1222
      goto _return;
290,972✔
1223
    } else {
1224
      // FOR NOW, SHOULD NOT REACH HERE
1225
      qError("Invalid fetchSessionId:%" PRId64 ", currentSessionId:%" PRId64, pCtx->fetchSessionId, sessionId);
×
1226
      return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
1227
    }
1228

1229
    if (locked) {
1230
      code = groupCacheSessionWait(pOperator, pCtx, sessionId, pSession, ppRes);
1231
      locked = false;
1232
      if (TSDB_CODE_SUCCESS != code) {
1233
        goto _return;
1234
      }
1235
      
1236
      break;
1237
    }
1238
    
1239
    (void)taosThreadMutexLock(&pSession->pGroupData->mutex);
1240
    locked = true;
1241
  };
1242

1243

1244
_return:
11,566,730✔
1245

1246
  if (locked) {
11,566,730✔
1247
    (void)taosThreadMutexUnlock(&pSession->pGroupData->mutex);
×
1248
  }
1249

1250
  return code;
11,566,730✔
1251
}
1252

1253

1254
static int32_t initGroupCacheBlockCache(SGroupCacheOperatorInfo* pInfo) {
1,195,276✔
1255
  SGcBlkCacheInfo* pCache = &pInfo->blkCache;
1,195,276✔
1256
  pCache->pDirtyBlk = taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_ENTRY_LOCK);
1,195,276✔
1257
  if (NULL == pCache->pDirtyBlk) {
1,195,276✔
1258
    return terrno;
×
1259
  }
1260
  taosHashSetFreeFp(pCache->pDirtyBlk, freeGcBlkBufInfo);
1,195,276✔
1261
  pCache->pReadBlk = taosHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_ENTRY_LOCK);
1,195,276✔
1262
  if (NULL == pCache->pReadBlk) {
1,195,276✔
1263
    return terrno;
×
1264
  }
1265
  pCache->writeDownstreamId = -1;
1,195,276✔
1266

1267
  return TSDB_CODE_SUCCESS;
1,195,276✔
1268
}
1269

1270
static FORCE_INLINE void initGroupCacheSessionCtx(SGcSessionCtx* pSession, SGcOperatorParam* pGcParam, SGroupCacheData* pGroup) {
1271
  pSession->pParam = pGcParam;
7,590,265✔
1272
  pSession->downstreamIdx = pGcParam->downstreamIdx;
7,590,265✔
1273
  pSession->pGroupData = pGroup;
7,590,265✔
1274
  pSession->lastBlkId = -1;
7,590,265✔
1275
}
7,590,265✔
1276

1277
static int32_t initGroupCacheSession(struct SOperatorInfo* pOperator, SOperatorParam* pParam, SGcSessionCtx** ppSession) {
7,609,480✔
1278
  int32_t code = TSDB_CODE_SUCCESS;
7,609,480✔
1279
  SGcSessionCtx ctx = {0};
7,609,480✔
1280
  SGcOperatorParam* pGcParam = pParam->value;  
7,609,480✔
1281
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
7,609,480✔
1282
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pParam->downstreamIdx];
7,609,480✔
1283
  SHashObj* pGrpHash = pGCache->globalGrp ? pGCache->pGrpHash : pCtx->pGrpHash;
7,609,480✔
1284

1285
  SGroupCacheData* pGroup = taosHashGet(pGrpHash, &pGcParam->tbUid, sizeof(pGcParam->tbUid));
7,609,480✔
1286
  if (NULL == pGroup && (NULL != pParam->pChildren || !pCtx->fetchDone)) {
7,609,480✔
1287
    code = addNewGroupData(pOperator, pParam, &pGroup, pGCache->batchFetch ? GROUP_CACHE_DEFAULT_VGID : pGcParam->vgId, pGcParam->tbUid);
167,611✔
1288
    if (TSDB_CODE_SUCCESS != code) {
167,611✔
1289
      return code;
×
1290
    }
1291
  }
1292

1293
  if (NULL == pGroup) {
7,609,480✔
1294
    return TSDB_CODE_SUCCESS;
19,215✔
1295
  }
1296

1297
  initGroupCacheSessionCtx(&ctx, pGcParam, pGroup);
7,590,265✔
1298

1299
  code = taosHashPut(pCtx->pSessions, &pGcParam->sessionId, sizeof(pGcParam->sessionId), &ctx, sizeof(ctx));
7,590,265✔
1300
  if (TSDB_CODE_SUCCESS != code) {
7,590,265✔
1301
    return code;
×
1302
  }
1303

1304
  *ppSession = taosHashGet(pCtx->pSessions, &pGcParam->sessionId, sizeof(pGcParam->sessionId));
7,590,265✔
1305
  if (NULL == *ppSession) {
7,590,265✔
1306
    qError("fail to get session %" PRId64 " from pSessions", pGcParam->sessionId);
×
1307
    QRY_ERR_RET(TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
1308
  }
1309

1310
  qDebug("session:%" PRId64 " initialized, downstreamIdx:%d, vgId:%d, tbUid:%" PRId64 ", needCache:%d", 
7,590,265✔
1311
    pGcParam->sessionId, pGcParam->downstreamIdx, pGcParam->vgId, pGcParam->tbUid, pGcParam->needCache);
1312
  
1313
  return TSDB_CODE_SUCCESS;
7,590,265✔
1314
}
1315

1316
static int32_t getBlkFromGroupCache(struct SOperatorInfo* pOperator, SSDataBlock** ppRes, SOperatorParam* pParam) {
11,585,945✔
1317
  int32_t code = TSDB_CODE_SUCCESS;
11,585,945✔
1318
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
11,585,945✔
1319
  SGcOperatorParam* pGcParam = pParam->value;
11,585,945✔
1320
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pParam->downstreamIdx];
11,585,945✔
1321
  SGcSessionCtx* pSession = taosHashGet(pCtx->pSessions, &pGcParam->sessionId, sizeof(pGcParam->sessionId));
11,585,945✔
1322
  if (NULL == pSession) {
11,585,945✔
1323
    int32_t code = initGroupCacheSession(pOperator, pParam, &pSession);
7,609,480✔
1324
    if (TSDB_CODE_SUCCESS != code) {
7,609,480✔
1325
      return code;
×
1326
    }
1327
    if (NULL == pSession) {
7,609,480✔
1328
      qDebug("session %" PRId64 " in downstream %d total got 0 rows since downtream fetch done", pGcParam->sessionId, pCtx->id);
19,215✔
1329
      return TSDB_CODE_SUCCESS;
19,215✔
1330
    }
1331
  } else if (pSession->pGroupData->needCache) {
3,976,465✔
1332
    SSDataBlock** ppBlock = taosHashGet(pGCache->blkCache.pReadBlk, &pGcParam->sessionId, sizeof(pGcParam->sessionId));
3,967,105✔
1333
    if (ppBlock) {
3,967,105✔
1334
      QRY_ERR_RET(releaseBaseBlockToList(pCtx, *ppBlock));
3,849,884✔
1335
      code = taosHashRemove(pGCache->blkCache.pReadBlk, &pGcParam->sessionId, sizeof(pGcParam->sessionId));
3,849,884✔
1336
      if (code) {
3,849,884✔
1337
        qError("taosHashRemove session %" PRId64 " from pReadBlk failed, error: %s", pGcParam->sessionId, tstrerror(code));
×
1338
        QRY_ERR_RET(code);
×
1339
      }
1340
    }
1341
  }
1342
  
1343
  QRY_ERR_RET(getBlkFromSessionCache(pOperator, pGcParam->sessionId, pSession, ppRes));
11,566,730✔
1344
  if (NULL == *ppRes) {
11,566,730✔
1345
    qDebug("session %" PRId64 " in downstream %d total got %" PRId64 " rows", pGcParam->sessionId, pCtx->id, pSession->resRows);
3,980,059✔
1346
    code = taosHashRemove(pCtx->pSessions, &pGcParam->sessionId, sizeof(pGcParam->sessionId));
3,980,059✔
1347
    if (code) {
3,980,059✔
1348
      qError("taosHashRemove session %" PRId64 " from pSessions failed, error: %s", pGcParam->sessionId, tstrerror(code));
×
1349
      QRY_ERR_RET(code);
×
1350
    }
1351
  } else {
1352
    pSession->resRows += (*ppRes)->info.rows;
7,586,671✔
1353
    qDebug("session %" PRId64 " in downstream %d got %" PRId64 " rows in one block", pGcParam->sessionId, pCtx->id, (*ppRes)->info.rows);
7,586,671✔
1354
  }
1355

1356
  return code;
11,566,730✔
1357
}
1358

1359
static int32_t initGroupCacheExecInfo(SOperatorInfo*        pOperator) {
1,195,276✔
1360
  SGroupCacheOperatorInfo* pInfo = pOperator->info;
1,195,276✔
1361
  pInfo->execInfo.pDownstreamBlkNum = taosMemoryCalloc(pOperator->numOfDownstream, sizeof(int64_t));
1,195,276✔
1362
  if (NULL == pInfo->execInfo.pDownstreamBlkNum) {
1,195,276✔
1363
    return terrno;
×
1364
  }
1365
  return TSDB_CODE_SUCCESS;
1,195,276✔
1366
}
1367

1368
static void freeRemoveGroupCacheData(void* p) {
591,289✔
1369
  SGroupCacheData* pGroup = p;
591,289✔
1370
  if (pGroup->vgId > 0 && pGroup->needCache) {
591,289✔
1371
    SGcFileCacheCtx* pFileCtx = &pGroup->pVgCtx->fileCtx;
×
1372
    if (pGroup->fileId >= 0) {
×
1373
      SGroupCacheFileInfo* pFileInfo = taosHashGet(pFileCtx->pCacheFile, &pGroup->fileId, sizeof(pGroup->fileId));
×
1374
      uint32_t remainNum = atomic_sub_fetch_32(&pFileInfo->groupNum, 1);
×
1375

1376
      qTrace("FileId:%d-%d-%d sub group num to %u", pGroup->downstreamIdx, pGroup->vgId, pFileCtx->fileId, remainNum);
×
1377

1378
      if (0 == remainNum && pGroup->fileId != pFileCtx->fileId) {
×
1379
        removeGroupCacheFile(pFileInfo);
×
1380

1381
#if 0
1382
        /* debug only */
1383
        snprintf(&pFileCtx->baseFilename[pFileCtx->baseNameLen], sizeof(pFileCtx->baseFilename) - pFileCtx->baseNameLen, "_%d", pGroup->fileId);
1384
        taosRemoveFile(pFileCtx->baseFilename);
1385
        /* debug only */
1386
#endif
1387

1388
        qTrace("FileId:%d-%d-%d removed", pGroup->downstreamIdx, pGroup->vgId, pFileCtx->fileId);
×
1389
        //taosHashRemove(pFileCtx->pCacheFile, &pGroup->fileId, sizeof(pGroup->fileId));
1390
      }
1391
    }
1392
  }
1393

1394
  taosArrayDestroy(pGroup->waitQueue);
591,289✔
1395
  taosArrayDestroy(pGroup->blkList.pList);
591,289✔
1396
  (void)taosThreadMutexDestroy(&pGroup->mutex);
591,289✔
1397

1398
  qTrace("group removed");
591,289✔
1399
}
591,289✔
1400

1401

1402

1403
static int32_t initGroupCacheDownstreamCtx(SOperatorInfo*          pOperator) {
1,195,276✔
1404
  SGroupCacheOperatorInfo* pInfo = pOperator->info;
1,195,276✔
1405
  pInfo->pDownstreams = taosMemoryCalloc(pOperator->numOfDownstream, sizeof(*pInfo->pDownstreams));
1,195,276✔
1406
  if (NULL == pInfo->pDownstreams) {
1,195,276✔
1407
    return terrno;
×
1408
  }
1409
  pInfo->downstreamNum = pOperator->numOfDownstream;
1,195,276✔
1410

1411
  for (int32_t i = 0; i < pOperator->numOfDownstream; ++i) {
3,585,828✔
1412
    SGcDownstreamCtx* pCtx = &pInfo->pDownstreams[i];
2,390,552✔
1413
    pCtx->id = i;
2,390,552✔
1414
    pCtx->fetchSessionId = -1;
2,390,552✔
1415
    pCtx->lastBlkUid = 0;
2,390,552✔
1416
    pCtx->pVgTbHash = tSimpleHashInit(10, taosGetDefaultHashFunction(TSDB_DATA_TYPE_INT));
2,390,552✔
1417
    if (NULL == pCtx->pVgTbHash) {
2,390,552✔
1418
      return terrno;
×
1419
    }
1420
    tSimpleHashSetFreeFp(pCtx->pVgTbHash, freeSGcVgroupCtx);      
2,390,552✔
1421

1422
    if (pInfo->batchFetch) {
2,390,552✔
1423
      int32_t defaultVg = 0;
2,388,212✔
1424
      SGcVgroupCtx vgCtx = {0};
2,388,212✔
1425
      initGcVgroupCtx(pOperator, &vgCtx, pCtx->id, defaultVg, NULL);      
2,388,212✔
1426
      QRY_ERR_RET(tSimpleHashPut(pCtx->pVgTbHash, &defaultVg, sizeof(defaultVg), &vgCtx, sizeof(vgCtx)));
2,388,212✔
1427
    }
1428
    
1429
    pCtx->pNewGrpList = taosArrayInit(10, sizeof(SGcNewGroupInfo));
2,390,552✔
1430
    if (NULL == pCtx->pNewGrpList) {
2,390,552✔
1431
      return terrno;
×
1432
    }
1433
    if (!pInfo->globalGrp) {
2,390,552✔
1434
      pCtx->pGrpHash = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_ENTRY_LOCK);
2,390,552✔
1435
      if (pCtx->pGrpHash == NULL) {
2,390,552✔
1436
        return terrno;
×
1437
      }
1438
      taosHashSetFreeFp(pCtx->pGrpHash, freeRemoveGroupCacheData);      
2,390,552✔
1439
    }
1440

1441
    pCtx->pSessions = taosHashInit(20, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_ENTRY_LOCK);
2,390,552✔
1442
    if (pCtx->pSessions == NULL) {
2,390,552✔
1443
      return terrno;
×
1444
    }
1445
    taosHashSetFreeFp(pCtx->pSessions, freeSGcSessionCtx);
2,390,552✔
1446
  
1447
    pCtx->pFreeBlock = taosArrayInit(10, POINTER_BYTES);
2,390,552✔
1448
    if (NULL == pCtx->pFreeBlock) {
2,390,552✔
1449
      return terrno;
×
1450
    }
1451
    
1452
    pCtx->pWaitSessions = taosHashInit(20, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BIGINT), false, HASH_ENTRY_LOCK);
2,390,552✔
1453
    if (pCtx->pWaitSessions == NULL) {
2,390,552✔
1454
      return terrno;
×
1455
    }
1456

1457
    (void)snprintf(pCtx->fileCtx.baseFilename, sizeof(pCtx->fileCtx.baseFilename) - 1, "%s/gc_%d_%" PRIx64 "_%" PRIu64 "_%p_%d", 
7,171,656✔
1458
      tsTempDir, taosGetPId(), pOperator->pTaskInfo->id.queryId, pOperator->pTaskInfo->id.taskId, pOperator, pCtx->id);
4,781,104✔
1459
    pCtx->fileCtx.baseFilename[sizeof(pCtx->fileCtx.baseFilename) - 1] = 0;
2,390,552✔
1460
    pCtx->fileCtx.baseNameLen = strlen(pCtx->fileCtx.baseFilename);
2,390,552✔
1461
  }
1462

1463
  return TSDB_CODE_SUCCESS;
1,195,276✔
1464
}
1465

1466
static int32_t groupCacheGetNext(struct SOperatorInfo* pOperator, SOperatorParam* pParam, SSDataBlock** pRes) {
11,585,945✔
1467
  *pRes = NULL;
11,585,945✔
1468

1469
  SSDataBlock* pBlock = NULL;
11,585,945✔
1470
  int32_t      code = 0;
11,585,945✔
1471

1472
  code = getBlkFromGroupCache(pOperator, &pBlock, pParam);
11,585,945✔
1473
  if (TSDB_CODE_SUCCESS != code) {
11,585,945✔
UNCOV
1474
    pOperator->pTaskInfo->code = code;
×
UNCOV
1475
    T_LONG_JMP(pOperator->pTaskInfo->env, pOperator->pTaskInfo->code);
×
1476
  }
1477

1478
  *pRes = pBlock;
11,585,945✔
1479
  return code;
11,585,945✔
1480
}
1481

UNCOV
1482
static int32_t groupCacheTableCacheEnd(SOperatorInfo* pOperator, SOperatorParam* pParam) {
×
UNCOV
1483
  SGcNotifyOperatorParam* pGcParam = pParam->value;
×
UNCOV
1484
  SGroupCacheOperatorInfo* pGCache = pOperator->info;
×
UNCOV
1485
  SGcDownstreamCtx* pCtx = &pGCache->pDownstreams[pGcParam->downstreamIdx];
×
UNCOV
1486
  SHashObj* pGrpHash = pGCache->globalGrp ? pGCache->pGrpHash : pCtx->pGrpHash;
×
1487

UNCOV
1488
  qTrace("try to remove group %" PRIu64, pGcParam->tbUid);
×
UNCOV
1489
  if (taosHashRemove(pGrpHash, &pGcParam->tbUid, sizeof(pGcParam->tbUid))) {
×
UNCOV
1490
    qError("failed to remove group %" PRIu64 " in vgId %d downstreamIdx %d", pGcParam->tbUid, pGcParam->vgId, pGcParam->downstreamIdx);
×
1491
    return TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
1492
  }
1493

1494
  return TSDB_CODE_SUCCESS;
×
1495
}
1496

1497
static void resetGroupCacheBlockCache(SGcBlkCacheInfo* pCache) {
1,632✔
1498
  taosHashClear(pCache->pDirtyBlk);
1,632✔
1499

1500
  void* p = NULL;
1,632✔
1501
  while (NULL != (p = taosHashIterate(pCache->pReadBlk, p))) {
1,632✔
UNCOV
1502
    blockDataDeepCleanup(*(SSDataBlock**)p);
×
1503
    freeGcBlockInList(p);
×
1504
  }
1505

1506
  taosHashClear(pCache->pReadBlk);
1,632✔
1507

1508
  pCache->dirtyLock = 0;
1,632✔
1509
  pCache->pDirtyHead = NULL;
1,632✔
1510
  pCache->pDirtyTail = NULL;
1,632✔
1511
  pCache->blkCacheSize = 0;
1,632✔
1512
  pCache->writeDownstreamId = -1;
1,632✔
1513

1514
  return;
1,632✔
1515
}
1516

1517
static int32_t resetGroupCacheDownstreamCtx(SOperatorInfo* pOper) {
1,632✔
1518
  int32_t code = 0, lino = 0;
1,632✔
1519
  SGroupCacheOperatorInfo* pInfo = pOper->info;
1,632✔
1520
  if (NULL == pInfo->pDownstreams) {
1,632✔
UNCOV
1521
    return TSDB_CODE_SUCCESS;
×
1522
  }
1523
  
1524
  for (int32_t i = 0; i < pInfo->downstreamNum; ++i) {
4,896✔
1525
    SGcDownstreamCtx* pCtx = &pInfo->pDownstreams[i];
3,264✔
1526
    taosArrayClear(pCtx->pNewGrpList);
3,264✔
1527
    taosHashClear(pCtx->pGrpHash);
3,264✔
1528

1529
    tSimpleHashClear(pCtx->pVgTbHash);
3,264✔
1530
    if (pInfo->batchFetch) {
3,264✔
1531
      int32_t defaultVg = 0;
3,264✔
1532
      SGcVgroupCtx vgCtx = {0};
3,264✔
1533
      initGcVgroupCtx(pOper, &vgCtx, pCtx->id, defaultVg, NULL);      
3,264✔
1534
      TAOS_CHECK_EXIT(tSimpleHashPut(pCtx->pVgTbHash, &defaultVg, sizeof(defaultVg), &vgCtx, sizeof(vgCtx)));
3,264✔
1535
    }
1536
    
1537
    taosArrayClearEx(pCtx->pFreeBlock, freeGcBlockInList);
3,264✔
1538
    taosHashClear(pCtx->pSessions);
3,264✔
1539
    taosHashClear(pCtx->pWaitSessions);
3,264✔
1540
    freeSGcFileCacheCtx(&pCtx->fileCtx);
3,264✔
1541

1542
    pCtx->grpLock = 0;
3,264✔
1543
    pCtx->fetchSessionId = -1;
3,264✔
1544
    pCtx->blkLock = 0;
3,264✔
1545
    pCtx->lastBlkUid = 0;
3,264✔
1546
    pCtx->pBaseBlock = NULL;
3,264✔
1547
    pCtx->fetchDone = false;
3,264✔
1548
  }
1549

1550
_exit:
1,632✔
1551

1552
  if (code) {
1,632✔
UNCOV
1553
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
1554
  }
1555

1556
  return code;
1,632✔
1557
}
1558

1559
static int32_t resetGroupCacheOperState(SOperatorInfo* pOper) {
1,632✔
1560
  int32_t code = 0, lino = 0;
1,632✔
1561
  SGroupCacheOperatorInfo* pInfo = pOper->info;
1,632✔
1562

1563
  pOper->status = OP_NOT_OPENED;
1,632✔
1564

1565
  resetGroupCacheBlockCache(&pInfo->blkCache);
1,632✔
1566

1567
  taosHashClear(pInfo->pGrpHash);
1,632✔
1568

1569
  TAOS_CHECK_EXIT(resetGroupCacheDownstreamCtx(pOper));
1,632✔
1570

1571
  memset(pInfo->execInfo.pDownstreamBlkNum, 0, pOper->numOfDownstream * sizeof(int64_t));
1,632✔
1572
  
1573
_exit:
1,632✔
1574

1575
  if (code) {
1,632✔
UNCOV
1576
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
1577
  }
1578

1579
  return code;
1,632✔
1580
}
1581

1582
int32_t createGroupCacheOperatorInfo(SOperatorInfo** pDownstream, int32_t numOfDownstream,
1,195,276✔
1583
                                     SGroupCachePhysiNode* pPhyciNode, SExecTaskInfo* pTaskInfo,
1584
                                     SOperatorInfo** pOptrInfo) {
1585
  QRY_PARAM_CHECK(pOptrInfo);
1,195,276✔
1586
  int32_t code = TSDB_CODE_SUCCESS;
1,195,276✔
1587

1588
  SGroupCacheOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SGroupCacheOperatorInfo));
1,195,276✔
1589
  SOperatorInfo*           pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
1,195,276✔
1590
  if (pOperator == NULL || pInfo == NULL) {
1,195,276✔
UNCOV
1591
    code = terrno;
×
UNCOV
1592
    goto _error;
×
1593
  }
1594
  initOperatorCostInfo(pOperator);
1,195,276✔
1595

1596
  pOperator->transparent = true;
1,195,276✔
1597
  pOperator->pPhyNode = pPhyciNode;
1,195,276✔
1598
  
1599
  setOperatorInfo(pOperator, "GroupCacheOperator", QUERY_NODE_PHYSICAL_PLAN_GROUP_CACHE, false, OP_NOT_OPENED, pInfo, pTaskInfo);
1,195,276✔
1600

1601
  pInfo->maxCacheSize = 0;
1,195,276✔
1602
  pInfo->grpByUid = pPhyciNode->grpByUid;
1,195,276✔
1603
  pInfo->globalGrp = pPhyciNode->globalGrp;
1,195,276✔
1604
  pInfo->batchFetch = pPhyciNode->batchFetch;
1,195,276✔
1605
  
1606
  if (!pInfo->grpByUid) {
1,195,276✔
UNCOV
1607
    qError("only group cache by uid is supported now");
×
UNCOV
1608
    code = TSDB_CODE_INVALID_PARA;
×
UNCOV
1609
    goto _error;
×
1610
  }
1611
  
1612
  if (pPhyciNode->pGroupCols) {
1,195,276✔
UNCOV
1613
    code = initGroupColsInfo(&pInfo->groupColsInfo, pPhyciNode->grpColsMayBeNull, pPhyciNode->pGroupCols);
×
UNCOV
1614
    if (code) {
×
1615
      goto _error;
×
1616
    }
1617
  }
1618

1619
  code = initGroupCacheBlockCache(pInfo);
1,195,276✔
1620
  if (code) {
1,195,276✔
1621
    goto _error;
×
1622
  }
1623

1624
  if (pInfo->globalGrp) {
1,195,276✔
UNCOV
1625
    pInfo->pGrpHash = taosHashInit(32, taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY), false, HASH_ENTRY_LOCK);
×
UNCOV
1626
    if (pInfo->pGrpHash == NULL) {
×
UNCOV
1627
      code = terrno;
×
UNCOV
1628
      goto _error;
×
1629
    }
UNCOV
1630
    taosHashSetFreeFp(pInfo->pGrpHash, freeRemoveGroupCacheData);
×
1631
  }
1632

1633
  code = appendDownstream(pOperator, pDownstream, numOfDownstream);
1,195,276✔
1634
  if (TSDB_CODE_SUCCESS != code) {
1,195,276✔
1635
    goto _error;
×
1636
  }
1637

1638
  code = initGroupCacheDownstreamCtx(pOperator);
1,195,276✔
1639
  if (TSDB_CODE_SUCCESS != code) {
1,195,276✔
UNCOV
1640
    goto _error;
×
1641
  }
1642

1643
  code = initGroupCacheExecInfo(pOperator);
1,195,276✔
1644
  if (TSDB_CODE_SUCCESS != code) {
1,195,276✔
UNCOV
1645
    goto _error;
×
1646
  }
1647

1648
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, NULL, NULL, destroyGroupCacheOperator, optrDefaultBufFn, NULL, groupCacheGetNext, groupCacheTableCacheEnd);
1,195,276✔
1649

1650
  setOperatorResetStateFn(pOperator, resetGroupCacheOperState);
1,195,276✔
1651

1652
  qTrace("new group cache operator, maxCacheSize:%" PRId64 ", globalGrp:%d, batchFetch:%d", pInfo->maxCacheSize, pInfo->globalGrp, pInfo->batchFetch);
1,195,276✔
1653

1654
  *pOptrInfo = pOperator;
1,195,276✔
1655
  return TSDB_CODE_SUCCESS;
1,195,276✔
1656

UNCOV
1657
_error:
×
UNCOV
1658
  if (pInfo != NULL) {
×
UNCOV
1659
    destroyGroupCacheOperator(pInfo);
×
1660
  }
1661

UNCOV
1662
  destroyOperatorAndDownstreams(pOperator, pDownstream, numOfDownstream);
×
UNCOV
1663
  pTaskInfo->code = code;
×
UNCOV
1664
  return code;
×
1665
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc