• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

taosdata / TDengine / #5011

03 Apr 2026 03:59PM UTC coverage: 72.3% (+0.008%) from 72.292%
#5011

push

travis-ci

web-flow
merge: from main to 3.0 branch #35067

4053 of 5985 new or added lines in 68 files covered. (67.72%)

732 existing lines in 143 files now uncovered.

257430 of 356056 relevant lines covered (72.3%)

131834103.52 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

76.78
/source/libs/executor/src/groupoperator.c
1
/*
2
 * Copyright (c) 2019 TAOS Data, Inc. <jhtao@taosdata.com>
3
 *
4
 * This program is free software: you can use, redistribute, and/or modify
5
 * it under the terms of the GNU Affero General Public License, version 3
6
 * or later ("AGPL"), as published by the Free Software Foundation.
7
 *
8
 * This program is distributed in the hope that it will be useful, but WITHOUT
9
 * ANY WARRANTY; without even the implied warranty of MERCHANTABILITY or
10
 * FITNESS FOR A PARTICULAR PURPOSE.
11
 *
12
 * You should have received a copy of the GNU Affero General Public License
13
 * along with this program. If not, see <http://www.gnu.org/licenses/>.
14
 */
15

16
#include "filter.h"
17
#include "function.h"
18
#include "os.h"
19
#include "query.h"
20
#include "tname.h"
21
#include "tutil.h"
22

23
#include "tdatablock.h"
24
#include "tmsg.h"
25

26
#include "executorInt.h"
27
#include "operator.h"
28
#include "querytask.h"
29
#include "tcompare.h"
30
#include "thash.h"
31
#include "ttypes.h"
32

33
typedef struct SGroupbyOperatorInfo {
34
  SOptrBasicInfo binfo;
35
  SAggSupporter  aggSup;
36
  SArray*        pGroupCols;     // group by columns, SArray<SColumn>
37
  SArray*        pGroupColVals;  // current group column values, SArray<SGroupKeys>
38
  bool           isInit;         // denote if current val is initialized or not
39
  char*          keyBuf;         // group by keys for hash
40
  int32_t        groupKeyLen;    // total group by column width
41
  SGroupResInfo  groupResInfo;
42
  SExprSupp      scalarSup;
43
  SOperatorInfo  *pOperator;
44
  SLimitInfo     limitInfo;
45
} SGroupbyOperatorInfo;
46

47
// The sort in partition may be needed later.
48
typedef struct SPartitionOperatorInfo {
49
  SOptrBasicInfo binfo;
50
  SArray*        pGroupCols;
51
  SArray*        pGroupColVals;  // current group column values, SArray<SGroupKeys>
52
  char*          keyBuf;         // group by keys for hash
53
  int32_t        groupKeyLen;    // total group by column width
54
  SHashObj*      pGroupSet;      // quick locate the window object for each result
55

56
  SDiskbasedBuf* pBuf;              // query result buffer based on blocked-wised disk file
57
  int32_t        rowCapacity;       // maximum number of rows for each buffer page
58
  int32_t*       columnOffset;      // start position for each column data
59
  SArray*        sortedGroupArray;  // SDataGroupInfo sorted by group id
60
  int32_t        groupIndex;        // group index
61
  int32_t        pageIndex;         // page index of current group
62
  SExprSupp      scalarSup;
63

64
  int32_t remainRows;
65
  int32_t orderedRows;
66
  SArray* pOrderInfoArr;
67
} SPartitionOperatorInfo;
68

69
static void*    getCurrentDataGroupInfo(const SPartitionOperatorInfo* pInfo, SDataGroupInfo** pGroupInfo, int32_t len);
70
static int32_t* setupColumnOffset(const SSDataBlock* pBlock, int32_t rowCapacity);
71
static int32_t  setGroupResultOutputBuf(SOperatorInfo* pOperator, SOptrBasicInfo* binfo, int32_t numOfCols, char* pData,
72
                                        int32_t bytes, uint64_t groupId, SDiskbasedBuf* pBuf, SAggSupporter* pAggSup);
73
static int32_t  extractColumnInfo(SNodeList* pNodeList, SArray** pArrayRes);
74
static int32_t  getPartitionPageRowCapacity(const SSDataBlock* pBlock, size_t pageSize, int32_t extraSize);
75

76
static void freeGroupKey(void* param) {
48,727,710✔
77
  SGroupKeys* pKey = (SGroupKeys*)param;
48,727,710✔
78
  taosMemoryFree(pKey->pData);
48,727,710✔
79
}
48,725,218✔
80

81
static void destroyGroupOperatorInfo(void* param) {
31,572,735✔
82
  if (param == NULL) {
31,572,735✔
83
    return;
×
84
  }
85
  SGroupbyOperatorInfo* pInfo = (SGroupbyOperatorInfo*)param;
31,572,735✔
86

87
  cleanupBasicInfo(&pInfo->binfo);
31,572,735✔
88
  taosMemoryFreeClear(pInfo->keyBuf);
31,571,141✔
89
  taosArrayDestroy(pInfo->pGroupCols);
31,570,313✔
90
  taosArrayDestroyEx(pInfo->pGroupColVals, freeGroupKey);
31,571,550✔
91
  cleanupExprSupp(&pInfo->scalarSup);
31,569,080✔
92

93
  if (pInfo->pOperator != NULL) {
31,572,169✔
94
    cleanupResultInfo(pInfo->pOperator->pTaskInfo, &pInfo->pOperator->exprSupp, &pInfo->groupResInfo, &pInfo->aggSup,
31,480,829✔
95
                      false);
96
    pInfo->pOperator = NULL;
31,478,211✔
97
  }
98

99
  cleanupGroupResInfo(&pInfo->groupResInfo);
31,570,111✔
100
  cleanupAggSup(&pInfo->aggSup);
31,570,641✔
101
  taosMemoryFreeClear(param);
31,569,749✔
102
}
103

104
static int32_t getPartitionPageRowCapacity(const SSDataBlock* pBlock, size_t pageSize, int32_t extraSize) {
3,004,988✔
105
  size_t  numOfCols = taosArrayGetSize(pBlock->pDataBlock);
3,004,988✔
106
  int32_t payloadSize = pageSize - extraSize;
3,005,242✔
107
  int32_t payloadRowSize = 0;
3,005,242✔
108
  int32_t numVarCols = 0;
3,005,242✔
109
  int32_t numFixCols = 0;
3,005,242✔
110

111
  for (int32_t i = 0; i < numOfCols; ++i) {
12,603,366✔
112
    SColumnInfoData* pCol = taosArrayGet(pBlock->pDataBlock, i);
9,599,084✔
113
    if (pCol == NULL) {
9,588,707✔
NEW
114
      terrno = TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
NEW
115
      return -1;
×
116
    }
117

118
    payloadRowSize += blockDataGetPagedColumnReservedBytes(pCol);
9,588,707✔
119
    if (IS_VAR_DATA_TYPE(pCol->info.type)) {
9,595,041✔
120
      ++numVarCols;
1,352,612✔
121
    } else {
122
      ++numFixCols;
8,245,512✔
123
    }
124
  }
125

126
  int32_t nRows = payloadSize / payloadRowSize;
3,004,282✔
127
  if (nRows < 1) {
3,004,282✔
NEW
128
    uError("rows %d in page is too small, payloadSize:%d, rowSize:%d", nRows, payloadSize, payloadRowSize);
×
NEW
129
    terrno = TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR;
×
NEW
130
    return -1;
×
131
  }
132

133
  int32_t result = -1;
3,004,282✔
134
  int32_t start = 1;
3,004,282✔
135
  int32_t end = nRows;
3,004,282✔
136
  while (start <= end) {
25,803,961✔
137
    int32_t mid = start + (end - start) / 2;
22,799,679✔
138
    int32_t midSize = payloadRowSize * mid + numVarCols * sizeof(int32_t) * mid + numFixCols * BitmapLen(mid);
22,799,679✔
139
    if (midSize > payloadSize) {
22,799,679✔
140
      result = mid;
4,522,381✔
141
      end = mid - 1;
4,522,381✔
142
    } else {
143
      start = mid + 1;
18,277,298✔
144
    }
145
  }
146

147
  return (result != -1) ? result - 1 : nRows;
3,004,282✔
148
}
149

150
static int32_t initGroupOptrInfo(SArray** pGroupColVals, int32_t* keyLen, char** keyBuf, const SArray* pGroupColList) {
34,481,561✔
151
  *pGroupColVals = taosArrayInit(4, sizeof(SGroupKeys));
34,481,561✔
152
  if ((*pGroupColVals) == NULL) {
34,473,009✔
153
    return terrno;
×
154
  }
155

156
  int32_t numOfGroupCols = taosArrayGetSize(pGroupColList);
34,477,012✔
157
  for (int32_t i = 0; i < numOfGroupCols; ++i) {
87,017,382✔
158
    SColumn* pCol = (SColumn*)taosArrayGet(pGroupColList, i);
52,538,827✔
159
    if (!pCol) {
52,541,686✔
160
      qError("%s failed at line %d since %s", __func__, __LINE__, tstrerror(terrno));
×
161
      return terrno;
×
162
    }
163
    (*keyLen) += pCol->bytes;  // actual data + null_flag
52,541,686✔
164

165
    SGroupKeys key = {0};
52,533,272✔
166
    key.bytes = pCol->bytes;
52,535,327✔
167
    key.type = pCol->type;
52,538,148✔
168
    key.isNull = false;
52,531,376✔
169
    key.pData = taosMemoryCalloc(1, pCol->bytes);
52,531,376✔
170
    if (key.pData == NULL) {
52,534,999✔
171
      return terrno;
×
172
    }
173

174
    void* tmp = taosArrayPush((*pGroupColVals), &key);
52,534,999✔
175
    if (!tmp) {
52,543,535✔
176
      return terrno;
×
177
    }
178
  }
179

180
  int32_t nullFlagSize = sizeof(int8_t) * numOfGroupCols;
34,478,555✔
181
  (*keyLen) += nullFlagSize;
34,478,555✔
182

183
  (*keyBuf) = taosMemoryCalloc(1, (*keyLen));
34,479,167✔
184
  if ((*keyBuf) == NULL) {
34,468,633✔
185
    return terrno;
×
186
  }
187

188
  return TSDB_CODE_SUCCESS;
34,478,133✔
189
}
190

191
static bool groupKeyCompare(SArray* pGroupCols, SArray* pGroupColVals, SSDataBlock* pBlock, int32_t rowIndex,
2,147,483,647✔
192
                            int32_t numOfGroupCols) {
193
  SColumnDataAgg* pColAgg = NULL;
2,147,483,647✔
194
  for (int32_t i = 0; i < numOfGroupCols; ++i) {
2,147,483,647✔
195
    SColumn*         pCol = taosArrayGet(pGroupCols, i);
2,147,483,647✔
196
    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, pCol->slotId);
2,147,483,647✔
197
    if (pBlock->pBlockAgg != NULL) {
2,147,483,647✔
198
      pColAgg = &pBlock->pBlockAgg[pCol->slotId];  // TODO is agg data matched?
×
199
    }
200

201
    bool isNull = colDataIsNull(pColInfoData, pBlock->info.rows, rowIndex, pColAgg);
2,147,483,647✔
202

203
    SGroupKeys* pkey = taosArrayGet(pGroupColVals, i);
2,147,483,647✔
204
    if (pkey->isNull && isNull) {
2,147,483,647✔
205
      continue;
2,147,483,647✔
206
    }
207

208
    if (isNull || pkey->isNull) {
2,147,483,647✔
209
      return false;
2,147,483,647✔
210
    }
211

212
    char* val = colDataGetData(pColInfoData, rowIndex);
2,147,483,647✔
213

214
    if (pkey->type == TSDB_DATA_TYPE_JSON) {
2,147,483,647✔
215
      int32_t dataLen = getJsonValueLen(val);
6,986✔
216

217
      if (memcmp(pkey->pData, val, dataLen) == 0) {
6,986✔
218
        continue;
998✔
219
      } else {
220
        return false;
5,988✔
221
      }
222
    } else if (IS_VAR_DATA_TYPE(pkey->type)) {
2,147,483,647✔
223
      if (IS_STR_DATA_BLOB(pkey->type)) {
2,147,483,647✔
UNCOV
224
        int32_t len = blobDataLen(val);
×
225
        if (len == blobDataLen(pkey->pData) && memcmp(blobDataVal(pkey->pData), blobDataVal(val), len) == 0) {
×
226
          continue;
×
227
        } else {
228
          return false;
×
229
        }
230
      } else {
231
        int32_t len = varDataLen(val);
2,147,483,647✔
232
        if (len == varDataLen(pkey->pData) && memcmp(varDataVal(pkey->pData), varDataVal(val), len) == 0) {
2,147,483,647✔
233
          continue;
2,147,483,647✔
234
        } else {
235
          return false;
1,147,794,339✔
236
        }
237
      }
238
    } else {
239
      if (memcmp(pkey->pData, val, pkey->bytes) != 0) {
2,147,483,647✔
240
        return false;
2,147,483,647✔
241
      }
242
    }
243
  }
244

245
  return true;
2,147,483,647✔
246
}
247

248
static void recordNewGroupKeys(SArray* pGroupCols, SArray* pGroupColVals, SSDataBlock* pBlock, int32_t rowIndex) {
2,147,483,647✔
249
  SColumnDataAgg* pColAgg = NULL;
2,147,483,647✔
250

251
  size_t numOfGroupCols = taosArrayGetSize(pGroupCols);
2,147,483,647✔
252

253
  for (int32_t i = 0; i < numOfGroupCols; ++i) {
2,147,483,647✔
254
    SColumn*         pCol = (SColumn*)taosArrayGet(pGroupCols, i);
2,147,483,647✔
255
    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, pCol->slotId);
2,147,483,647✔
256

257
    // valid range check. todo: return error code.
258
    if (pCol->slotId > taosArrayGetSize(pBlock->pDataBlock)) {
2,147,483,647✔
259
      continue;
×
260
    }
261

262
    if (pBlock->pBlockAgg != NULL) {
2,147,483,647✔
263
      pColAgg = &pBlock->pBlockAgg[pCol->slotId];  // TODO is agg data matched?
×
264
    }
265

266
    SGroupKeys* pkey = taosArrayGet(pGroupColVals, i);
2,147,483,647✔
267
    if (colDataIsNull(pColInfoData, pBlock->info.rows, rowIndex, pColAgg)) {
2,147,483,647✔
268
      pkey->isNull = true;
2,147,483,647✔
269
    } else {
270
      pkey->isNull = false;
2,147,483,647✔
271
      char* val = colDataGetData(pColInfoData, rowIndex);
2,147,483,647✔
272
      if (pkey->type == TSDB_DATA_TYPE_JSON) {
2,147,483,647✔
273
        // if (tTagIsJson(val)) {
274
        //   terrno = TSDB_CODE_QRY_JSON_IN_GROUP_ERROR;
275
        //   return;
276
        // }
277
        int32_t dataLen = getJsonValueLen(val);
40,967✔
278
        memcpy(pkey->pData, val, dataLen);
41,774✔
279
      } else if (IS_VAR_DATA_TYPE(pkey->type)) {
2,147,483,647✔
280
        if (IS_STR_DATA_BLOB(pkey->type)) {
2,147,483,647✔
281
          memcpy(pkey->pData, val, blobDataTLen(val));
2,435✔
282
        } else {
283
          memcpy(pkey->pData, val, varDataTLen(val));
2,147,483,647✔
284
        }
285
      } else {
286
        memcpy(pkey->pData, val, pkey->bytes);
2,147,483,647✔
287
      }
288
    }
289
  }
290
}
2,147,483,647✔
291

292
static int32_t buildGroupKeys(void* pKey, const SArray* pGroupColVals) {
2,147,483,647✔
293
  size_t numOfGroupCols = taosArrayGetSize(pGroupColVals);
2,147,483,647✔
294

295
  char* isNull = (char*)pKey;
2,147,483,647✔
296
  char* pStart = (char*)pKey + sizeof(int8_t) * numOfGroupCols;
2,147,483,647✔
297
  for (int32_t i = 0; i < numOfGroupCols; ++i) {
2,147,483,647✔
298
    SGroupKeys* pkey = taosArrayGet(pGroupColVals, i);
2,147,483,647✔
299
    if (pkey->isNull) {
2,147,483,647✔
300
      isNull[i] = 1;
2,147,483,647✔
301
      continue;
2,147,483,647✔
302
    }
303

304
    isNull[i] = 0;
2,147,483,647✔
305
    if (pkey->type == TSDB_DATA_TYPE_JSON) {
2,147,483,647✔
306
      int32_t dataLen = getJsonValueLen(pkey->pData);
40,967✔
307
      memcpy(pStart, (pkey->pData), dataLen);
40,967✔
308
      pStart += dataLen;
40,967✔
309
    } else if (IS_VAR_DATA_TYPE(pkey->type)) {
2,147,483,647✔
310
      if (IS_STR_DATA_BLOB(pkey->type)) {
2,147,483,647✔
311
        blobDataCopy(pStart, pkey->pData);
748✔
312
        pStart += blobDataTLen(pkey->pData);
×
313
      } else {
314
        varDataCopy(pStart, pkey->pData);
2,147,483,647✔
315
        pStart += varDataTLen(pkey->pData);
2,147,483,647✔
316
      }
317
    } else {
318
      memcpy(pStart, pkey->pData, pkey->bytes);
2,147,483,647✔
319
      pStart += pkey->bytes;
2,147,483,647✔
320
    }
321
  }
322

323
  return (int32_t)(pStart - (char*)pKey);
2,147,483,647✔
324
}
325

326
// assign the group keys or user input constant values if required
327
static void doAssignGroupKeys(SqlFunctionCtx* pCtx, int32_t numOfOutput, int32_t totalRows, int32_t rowIndex) {
2,147,483,647✔
328
  for (int32_t i = 0; i < numOfOutput; ++i) {
2,147,483,647✔
329
    if (pCtx[i].functionId == -1) {  // select count(*),key from t group by key.
2,147,483,647✔
330
      SResultRowEntryInfo* pEntryInfo = GET_RES_INFO(&pCtx[i]);
2,147,483,647✔
331

332
      SColumnInfoData* pColInfoData = pCtx[i].input.pData[0];
2,147,483,647✔
333
      // todo OPT all/all not NULL
334
      if (!colDataIsNull(pColInfoData, totalRows, rowIndex, NULL)) {
2,147,483,647✔
335
        char* dest = GET_ROWCELL_INTERBUF(pEntryInfo);
2,147,483,647✔
336
        char* data = colDataGetData(pColInfoData, rowIndex);
2,147,483,647✔
337

338
        if (pColInfoData->info.type == TSDB_DATA_TYPE_JSON) {
2,147,483,647✔
339
          int32_t dataLen = getJsonValueLen(data);
15,950✔
340
          memcpy(dest, data, dataLen);
15,950✔
341
        } else if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
2,147,483,647✔
342
          if (IS_STR_DATA_BLOB(pColInfoData->info.type)) {
1,643,598,950✔
UNCOV
343
            blobDataCopy(dest, data);
×
344
          } else {
345
            varDataCopy(dest, data);
1,648,282,274✔
346
          }
347
        } else {
348
          memcpy(dest, data, pColInfoData->info.bytes);
2,147,483,647✔
349
        }
350
      } else {  // it is a NULL value
351
        pEntryInfo->isNullRes = 1;
2,147,483,647✔
352
      }
353

354
      pEntryInfo->numOfRes = 1;
2,147,483,647✔
355
    }
356
  }
357
}
2,147,483,647✔
358

359
static void doHashGroupbyAgg(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
235,193,741✔
360
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;
235,193,741✔
361
  SGroupbyOperatorInfo* pInfo = pOperator->info;
235,199,210✔
362

363
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
235,201,331✔
364
  int32_t         numOfGroupCols = taosArrayGetSize(pInfo->pGroupCols);
235,202,736✔
365
  //  if (type == TSDB_DATA_TYPE_FLOAT || type == TSDB_DATA_TYPE_DOUBLE) {
366
  //  qError("QInfo:0x%" PRIx64 ", group by not supported on double/float columns, abort", GET_TASKID(pRuntimeEnv));
367
  //    return;
368
  //  }
369

370
  int32_t len = 0;
235,201,314✔
371
  terrno = TSDB_CODE_SUCCESS;
235,201,314✔
372

373
  int32_t num = 0;
235,199,962✔
374
  for (int32_t j = 0; j < pBlock->info.rows; ++j) {
2,147,483,647✔
375
    // Compare with the previous row of this column, and do not set the output buffer again if they are identical.
376
    if (!pInfo->isInit) {
2,147,483,647✔
377
      recordNewGroupKeys(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j);
23,639,943✔
378
      pInfo->isInit = true;
23,643,223✔
379
      num++;
23,641,756✔
380
      continue;
23,641,756✔
381
    }
382

383
    bool equal = groupKeyCompare(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j, numOfGroupCols);
2,147,483,647✔
384
    if (equal) {
2,147,483,647✔
385
      num++;
2,147,483,647✔
386
      continue;
2,147,483,647✔
387
    }
388

389
    // The first row of a new block does not belongs to the previous existed group
390
    if (j == 0) {
2,147,483,647✔
391
      recordNewGroupKeys(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j);
206,142,547✔
392
      num = 1;
206,138,241✔
393
      continue;
206,138,241✔
394
    }
395

396
    len = buildGroupKeys(pInfo->keyBuf, pInfo->pGroupColVals);
2,147,483,647✔
397
    int32_t ret = setGroupResultOutputBuf(pOperator, &(pInfo->binfo), pOperator->exprSupp.numOfExprs, pInfo->keyBuf,
2,147,483,647✔
398
                                          len, pBlock->info.id.groupId, pInfo->aggSup.pResultBuf, &pInfo->aggSup);
399
    if (ret != TSDB_CODE_SUCCESS) {  // null data, too many state code
2,147,483,647✔
400
      T_LONG_JMP(pTaskInfo->env, ret);
×
401
    }
402

403
    int32_t rowIndex = j - num;
2,147,483,647✔
404
    ret = applyAggFunctionOnPartialTuples(pTaskInfo, pCtx, NULL, rowIndex, num, pBlock->info.rows,
2,147,483,647✔
405
                                          pOperator->exprSupp.numOfExprs);
406
    if (ret != TSDB_CODE_SUCCESS) {
2,147,483,647✔
407
      T_LONG_JMP(pTaskInfo->env, ret);
×
408
    }
409

410
    // assign the group keys or user input constant values if required
411
    doAssignGroupKeys(pCtx, pOperator->exprSupp.numOfExprs, pBlock->info.rows, rowIndex);
2,147,483,647✔
412
    recordNewGroupKeys(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j);
2,147,483,647✔
413
    num = 1;
2,147,483,647✔
414
  }
415

416
  // The data of the last group is processed here, and if there is only one group, it is also processed here.
417
  if (num > 0) {
235,198,041✔
418
    len = buildGroupKeys(pInfo->keyBuf, pInfo->pGroupColVals);
235,199,477✔
419
    int32_t ret = setGroupResultOutputBuf(pOperator, &(pInfo->binfo), pOperator->exprSupp.numOfExprs, pInfo->keyBuf,
235,197,069✔
420
                                          len, pBlock->info.id.groupId, pInfo->aggSup.pResultBuf, &pInfo->aggSup);
421
    if (ret != TSDB_CODE_SUCCESS) {
235,189,680✔
422
      T_LONG_JMP(pTaskInfo->env, ret);
×
423
    }
424

425
    int32_t rowIndex = pBlock->info.rows - num;
235,189,680✔
426
    ret = applyAggFunctionOnPartialTuples(pTaskInfo, pCtx, NULL, rowIndex, num, pBlock->info.rows,
235,191,411✔
427
                                          pOperator->exprSupp.numOfExprs);
428
    if (ret != TSDB_CODE_SUCCESS) {
235,185,655✔
429
      T_LONG_JMP(pTaskInfo->env, ret);
×
430
    }
431
    doAssignGroupKeys(pCtx, pOperator->exprSupp.numOfExprs, pBlock->info.rows, rowIndex);
235,185,655✔
432
  }
433
}
235,187,673✔
434

435
bool hasRemainResultByHash(SOperatorInfo* pOperator) {
2,147,483,647✔
436
  SGroupbyOperatorInfo* pInfo = pOperator->info;
2,147,483,647✔
437
  SSHashObj*            pHashmap = pInfo->aggSup.pResultRowHashTable;
2,147,483,647✔
438
  return pInfo->groupResInfo.index < tSimpleHashGetSize(pHashmap);
2,147,483,647✔
439
}
440

441
void doBuildResultDatablockByHash(SOperatorInfo* pOperator, SOptrBasicInfo* pbInfo, SGroupResInfo* pGroupResInfo,
2,141,747,018✔
442
                                  SDiskbasedBuf* pBuf) {
443
  SGroupbyOperatorInfo* pInfo = pOperator->info;
2,141,747,018✔
444
  SSHashObj*            pHashmap = pInfo->aggSup.pResultRowHashTable;
2,141,748,889✔
445
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;
2,141,748,889✔
446

447
  SSDataBlock* pBlock = pInfo->binfo.pRes;
2,141,748,889✔
448

449
  // set output datablock version
450
  pBlock->info.version = pTaskInfo->version;
2,141,745,483✔
451

452
  blockDataCleanup(pBlock);
2,141,748,730✔
453
  if (!hasRemainResultByHash(pOperator)) {
2,141,750,307✔
454
    return;
7,793,611✔
455
  }
456

457
  pBlock->info.id.groupId = 0;
2,133,952,351✔
458
  pBlock->info.id.baseGId = 0;
2,133,952,429✔
459
  if (!pInfo->binfo.mergeResultBlock) {
2,133,952,429✔
460
    doCopyToSDataBlockByHash(pTaskInfo, pBlock, &pOperator->exprSupp, pInfo->aggSup.pResultBuf, &pInfo->groupResInfo,
2,116,354,699✔
461
                             pHashmap, pOperator->resultInfo.threshold, false);
462
  } else {
463
    while (hasRemainResultByHash(pOperator)) {
35,181,168✔
464
      doCopyToSDataBlockByHash(pTaskInfo, pBlock, &pOperator->exprSupp, pInfo->aggSup.pResultBuf, &pInfo->groupResInfo,
17,598,828✔
465
                               pHashmap, pOperator->resultInfo.threshold, true);
466
      if (pBlock->info.rows >= pOperator->resultInfo.threshold) {
17,598,828✔
467
        break;
16,488✔
468
      }
469
      pBlock->info.id.groupId = 0;
17,582,340✔
470
      pBlock->info.id.baseGId = 0;
17,582,340✔
471
    }
472

473
    // clear the group id info in SSDataBlock, since the client does not need it
474
    pBlock->info.id.groupId = 0;
17,599,359✔
475
    pBlock->info.id.baseGId = 0;
17,599,359✔
476
  }
477
}
478

479
static bool slimitReached(SLimitInfo* pLimitInfo) {
2,110,405,712✔
480
  if (pLimitInfo && pLimitInfo->slimit.limit >= 0 &&
2,110,405,712✔
481
      pLimitInfo->numOfOutputGroups >= pLimitInfo->slimit.limit) {
70,712✔
482
    return true;  // limit reached, stop processing further rows
24,385✔
483
  }
484
  return false;
2,110,381,833✔
485
}
486

487
static int32_t doGroupResultSlimit(SSDataBlock* pRes, SLimitInfo* pLimitInfo) {
2,141,751,037✔
488
  int32_t code = TSDB_CODE_SUCCESS;
2,141,751,037✔
489
  int32_t lino = 0;
2,141,751,037✔
490

491
  if (pRes == NULL || pRes->info.rows == 0 || !pLimitInfo) {
2,141,751,037✔
492
    return TSDB_CODE_SUCCESS;
7,905,314✔
493
  }
494

495
  if (pLimitInfo->remainGroupOffset > 0) {
2,133,845,723✔
496
    if (pRes->info.rows <= pLimitInfo->remainGroupOffset) {
77,581✔
497
      pLimitInfo->remainGroupOffset -= pRes->info.rows;
19,685✔
498
      blockDataCleanup(pRes);
19,685✔
499
      return TSDB_CODE_SUCCESS;
19,685✔
500
    } else {
501
      code = blockDataTrimFirstRows(pRes, pLimitInfo->remainGroupOffset);
57,896✔
502
      QUERY_CHECK_CODE(code, lino, _end);
57,896✔
503
      pLimitInfo->remainGroupOffset = 0;
57,896✔
504
    }
505
  }
506

507
  if (pLimitInfo->slimit.limit >= 0 && pRes->info.rows > 0) {
2,133,826,038✔
508
    int32_t remainRows = pLimitInfo->slimit.limit - pLimitInfo->numOfOutputGroups;
203,331✔
509
    if (pRes->info.rows > remainRows) {
203,331✔
510
      blockDataKeepFirstNRows(pRes, remainRows);
77,402✔
511
    }
512
    pLimitInfo->numOfOutputGroups += pRes->info.rows;
203,331✔
513
  }
514

515
_end:
2,133,623,213✔
516
  if (code != TSDB_CODE_SUCCESS) {
2,133,826,544✔
517
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
518
  }
519
  return code;
2,133,826,544✔
520
}
521

522
static SSDataBlock* buildGroupResultDataBlockByHash(SOperatorInfo* pOperator) {
2,141,742,275✔
523
  int32_t               code = TSDB_CODE_SUCCESS;
2,141,742,275✔
524
  int32_t               lino = 0;
2,141,742,275✔
525
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;
2,141,742,275✔
526
  SGroupbyOperatorInfo* pInfo = pOperator->info;
2,141,745,066✔
527
  SSDataBlock*          pRes = pInfo->binfo.pRes;
2,141,743,398✔
528
  SLimitInfo*           pLimitInfo = &pInfo->limitInfo;
2,141,745,067✔
529

530
  // after filter, if result block turn to null, get next from whole set
531
  while (1) {
532
    doBuildResultDatablockByHash(pOperator, &pInfo->binfo, &pInfo->groupResInfo, pInfo->aggSup.pResultBuf);
2,141,745,781✔
533

534
    code = doFilter(pRes, pOperator->exprSupp.pFilterInfo, NULL, NULL);
2,141,750,560✔
535
    QUERY_CHECK_CODE(code, lino, _end);
2,141,751,568✔
536

537
    code = doGroupResultSlimit(pRes, pLimitInfo);
2,141,751,568✔
538
    QUERY_CHECK_CODE(code, lino, _end);
2,141,751,543✔
539

540
    if (!hasRemainResultByHash(pOperator) || slimitReached(pLimitInfo)) {
2,141,751,543✔
541
      setOperatorCompleted(pOperator);
31,370,747✔
542
      // clean hash after completed
543
      tSimpleHashCleanup(pInfo->aggSup.pResultRowHashTable);
31,370,241✔
544
      pInfo->aggSup.pResultRowHashTable = NULL;
31,369,710✔
545
      break;
31,368,619✔
546
    }
547

548
    if (pRes->info.rows > 0) {
2,110,381,327✔
549
      break;
2,110,380,132✔
550
    }
551
  }
552

553
_end:
2,141,748,751✔
554
  if (code != TSDB_CODE_SUCCESS) {
2,141,748,751✔
555
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
556
    T_LONG_JMP(pTaskInfo->env, code);
×
557
  }
558
  return (pRes->info.rows == 0) ? NULL : pRes;
2,141,748,751✔
559
}
560

561
static int32_t hashGroupbyAggregateNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
2,147,483,647✔
562
  int32_t               code = TSDB_CODE_SUCCESS;
2,147,483,647✔
563
  int32_t               lino = 0;
2,147,483,647✔
564
  SExecTaskInfo*        pTaskInfo = pOperator->pTaskInfo;
2,147,483,647✔
565
  SGroupbyOperatorInfo* pInfo = pOperator->info;
2,147,483,647✔
566
  SGroupResInfo*        pGroupResInfo = &pInfo->groupResInfo;
2,147,483,647✔
567
  int32_t               order = pInfo->binfo.inputTsOrder;
2,147,483,647✔
568

569
  QRY_PARAM_CHECK(ppRes);
2,147,483,647✔
570
  if (pOperator->status == OP_EXEC_DONE) {
2,147,483,647✔
571
    return code;
23,353,780✔
572
  }
573

574
  if (pOperator->status == OP_RES_TO_RETURN) {
2,141,760,979✔
575
    (*ppRes) = buildGroupResultDataBlockByHash(pOperator);
2,110,299,561✔
576
    return code;
2,110,303,169✔
577
  }
578

579
  while (1) {
235,187,349✔
580
    SSDataBlock* pBlock = getNextBlockFromDownstream(pOperator, 0);
266,652,013✔
581
    if (pBlock == NULL) {
266,660,516✔
582
      break;
31,446,003✔
583
    }
584

585
    pInfo->binfo.pRes->info.scanFlag = pBlock->info.scanFlag;
235,214,513✔
586

587
    // the pDataBlock are always the same one, no need to call this again
588
    code = setInputDataBlock(&pOperator->exprSupp, pBlock, order, pBlock->info.scanFlag, true);
235,224,730✔
589
    QUERY_CHECK_CODE(code, lino, _end);
235,220,610✔
590

591
    // there is an scalar expression that needs to be calculated right before apply the group aggregation.
592
    if (pInfo->scalarSup.pExprInfo != NULL) {
235,220,610✔
593
      code = projectApplyFunctions(pInfo->scalarSup.pExprInfo, pBlock, pBlock, pInfo->scalarSup.pCtx,
43,374,408✔
594
                                   pInfo->scalarSup.numOfExprs, NULL, GET_STM_RTINFO(pOperator->pTaskInfo));
43,379,733✔
595
      QUERY_CHECK_CODE(code, lino, _end);
43,372,062✔
596
    }
597

598
    doHashGroupbyAgg(pOperator, pBlock);
235,193,339✔
599
  }
600

601
  pOperator->status = OP_RES_TO_RETURN;
31,446,003✔
602

603
  // initGroupedResultInfo(&pInfo->groupResInfo, pInfo->aggSup.pResultRowHashTable, 0);
604
  if (pGroupResInfo->pRows != NULL) {
31,446,534✔
605
    taosArrayDestroy(pGroupResInfo->pRows);
×
606
  }
607

608
  if (pGroupResInfo->pBuf) {
31,446,003✔
609
    taosMemoryFree(pGroupResInfo->pBuf);
×
610
    pGroupResInfo->pBuf = NULL;
×
611
  }
612

613
  pGroupResInfo->index = 0;
31,446,003✔
614
  pGroupResInfo->iter = 0;
31,446,003✔
615
  pGroupResInfo->dataPos = NULL;
31,446,004✔
616

617
_end:
31,465,565✔
618
  if (code != TSDB_CODE_SUCCESS) {
31,465,565✔
619
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
19,600✔
620
    pTaskInfo->code = code;
19,600✔
621
    T_LONG_JMP(pTaskInfo->env, code);
19,600✔
622
  } else {
623
    (*ppRes) = buildGroupResultDataBlockByHash(pOperator);
31,445,965✔
624
  }
625

626
  return code;
31,444,913✔
627
}
628

629
static int32_t resetGroupOperState(SOperatorInfo* pOper) {
×
630
  SGroupbyOperatorInfo* pInfo = pOper->info;
×
631
  SExecTaskInfo*           pTaskInfo = pOper->pTaskInfo;
×
632
  SAggPhysiNode* pPhynode = (SAggPhysiNode*)pOper->pPhyNode;
×
633
  resetBasicOperatorState(&pInfo->binfo);
×
634
  pOper->status = OP_NOT_OPENED;
×
635

636
  cleanupResultInfo(pInfo->pOperator->pTaskInfo, &pInfo->pOperator->exprSupp, &pInfo->groupResInfo, &pInfo->aggSup,
×
637
    false);
638

639
  cleanupGroupResInfo(&pInfo->groupResInfo);
×
640

641
  qInfo("[group key] len use:%d", pInfo->groupKeyLen);
×
642
  int32_t code = resetAggSup(&pOper->exprSupp, &pInfo->aggSup, pTaskInfo, pPhynode->pAggFuncs, pPhynode->pGroupKeys,
×
643
    pInfo->groupKeyLen + POINTER_BYTES, pTaskInfo->id.str, NULL,
×
644
    &pTaskInfo->storageAPI.functionStore);
645

646
  if (code == 0){
×
647
    code = resetExprSupp(&pInfo->scalarSup, pTaskInfo, pPhynode->pExprs, NULL,
×
648
      &pTaskInfo->storageAPI.functionStore);
649
  }
650

651
  pInfo->isInit = false;
×
652

653
  return code;
×
654
}
655

656
int32_t createGroupOperatorInfo(SOperatorInfo* downstream, SAggPhysiNode* pAggNode, SExecTaskInfo* pTaskInfo,
31,565,965✔
657
                                SOperatorInfo** pOptrInfo) {
658
  QRY_PARAM_CHECK(pOptrInfo);
31,565,965✔
659

660
  int32_t               code = TSDB_CODE_SUCCESS;
31,567,642✔
661
  int32_t               lino = 0;
31,567,642✔
662
  SGroupbyOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SGroupbyOperatorInfo));
31,567,642✔
663
  SOperatorInfo*        pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
31,560,642✔
664
  if (pInfo == NULL || pOperator == NULL) {
31,563,830✔
665
    code = terrno;
19✔
666
    goto _error;
×
667
  }
668
  initOperatorCostInfo(pOperator);
31,565,458✔
669

670
  pOperator->pPhyNode = (SNode*)pAggNode;
31,570,819✔
671
  pOperator->exprSupp.hasWindowOrGroup = true;
31,570,819✔
672
  pOperator->exprSupp.hasWindow = false;
31,570,222✔
673

674
  SSDataBlock* pResBlock = createDataBlockFromDescNode(pAggNode->node.pOutputDataBlockDesc);
31,568,188✔
675
  if (pResBlock == NULL) {
31,572,358✔
676
    code = terrno;
×
677
    goto _error;
×
678
  }
679
  initBasicInfo(&pInfo->binfo, pResBlock);
31,572,358✔
680

681
  initLimitInfo(pAggNode->node.pLimit, pAggNode->node.pSlimit, &pInfo->limitInfo);
31,569,711✔
682

683
  pInfo->pGroupCols = NULL;
31,571,828✔
684
  code = extractColumnInfo(pAggNode->pGroupKeys, &pInfo->pGroupCols);
31,571,828✔
685
  QUERY_CHECK_CODE(code, lino, _error);
31,562,816✔
686

687
  int32_t    numOfScalarExpr = 0;
31,562,816✔
688
  SExprInfo* pScalarExprInfo = NULL;
31,564,826✔
689
  if (pAggNode->pExprs != NULL) {
31,565,276✔
690
    code = createExprInfo(pAggNode->pExprs, NULL, &pScalarExprInfo, &numOfScalarExpr);
15,171,666✔
691
    QUERY_CHECK_CODE(code, lino, _error);
15,169,293✔
692
  }
693

694
  code = initExprSupp(&pInfo->scalarSup, pScalarExprInfo, numOfScalarExpr, &pTaskInfo->storageAPI.functionStore);
31,467,515✔
695
  QUERY_CHECK_CODE(code, lino, _error);
31,470,882✔
696

697
  initResultSizeInfo(&pOperator->resultInfo, 4096);
31,470,882✔
698
  code = blockDataEnsureCapacity(pInfo->binfo.pRes, pOperator->resultInfo.capacity);
31,475,574✔
699
  QUERY_CHECK_CODE(code, lino, _error);
31,478,819✔
700

701
  code = initGroupOptrInfo(&pInfo->pGroupColVals, &pInfo->groupKeyLen, &pInfo->keyBuf, pInfo->pGroupCols);
31,478,819✔
702
  QUERY_CHECK_CODE(code, lino, _error);
31,472,417✔
703

704
  int32_t    num = 0;
31,472,417✔
705
  SExprInfo* pExprInfo = NULL;
31,473,445✔
706

707
  code = createExprInfo(pAggNode->pAggFuncs, pAggNode->pGroupKeys, &pExprInfo, &num);
31,472,993✔
708
  QUERY_CHECK_CODE(code, lino, _error);
31,461,358✔
709

710
  code = initAggSup(&pOperator->exprSupp, &pInfo->aggSup, pExprInfo, num, pInfo->groupKeyLen, pTaskInfo->id.str,
31,461,358✔
711
                    NULL, &pTaskInfo->storageAPI.functionStore);
712
  QUERY_CHECK_CODE(code, lino, _error);
31,469,971✔
713

714
  code = filterInitFromNode((SNode*)pAggNode->node.pConditions, &pOperator->exprSupp.pFilterInfo, 0,
31,470,860✔
715
                            pTaskInfo->pStreamRuntimeInfo);
31,469,971✔
716
  QUERY_CHECK_CODE(code, lino, _error);
31,468,159✔
717

718
  initResultRowInfo(&pInfo->binfo.resultRowInfo);
31,468,159✔
719
  setOperatorInfo(pOperator, "GroupbyAggOperator", 0, true, OP_NOT_OPENED, pInfo, pTaskInfo);
31,468,730✔
720

721
  pInfo->binfo.mergeResultBlock = pAggNode->mergeDataBlock;
31,473,204✔
722
  pInfo->binfo.inputTsOrder = pAggNode->node.inputTsOrder;
31,465,778✔
723
  pInfo->binfo.outputTsOrder = pAggNode->node.outputTsOrder;
31,472,584✔
724

725
  pInfo->pOperator = pOperator;
31,461,699✔
726

727
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, hashGroupbyAggregateNext, NULL, destroyGroupOperatorInfo,
31,475,367✔
728
                                         optrDefaultBufFn, NULL, optrDefaultGetNextExtFn, NULL);
729
  setOperatorResetStateFn(pOperator, resetGroupOperState);
31,453,228✔
730
  code = appendDownstream(pOperator, &downstream, 1);
31,462,593✔
731
  QUERY_CHECK_CODE(code, lino, _error);
31,477,249✔
732

733
  *pOptrInfo = pOperator;
31,477,249✔
734
  return TSDB_CODE_SUCCESS;
31,472,749✔
735

736
_error:
92,960✔
737
  if (pInfo != NULL) destroyGroupOperatorInfo(pInfo);
92,960✔
738
  destroyOperatorAndDownstreams(pOperator, &downstream, 1);
92,960✔
739
  pTaskInfo->code = code;
92,960✔
740
  return code;
92,960✔
741
}
742

743
SSDataBlock* createBlockDataNotLoaded(const SOperatorInfo* pOperator, SSDataBlock* pDataBlock) {
×
744
  int32_t code = TSDB_CODE_SUCCESS;
×
745
  int32_t lino = 0;
×
746
  if (pDataBlock == NULL) {
×
747
    return NULL;
×
748
  }
749

750
  SSDataBlock* pDstBlock = NULL;
×
751
  code = createDataBlock(&pDstBlock);
×
752
  QUERY_CHECK_CODE(code, lino, _end);
×
753

754
  pDstBlock->info = pDataBlock->info;
×
755
  pDstBlock->info.id.blockId = pOperator->resultDataBlockId;
×
756
  pDstBlock->info.capacity = 0;
×
757
  pDstBlock->info.rowSize = 0;
×
758

759
  size_t numOfCols = pOperator->exprSupp.numOfExprs;
×
760
  if (pDataBlock->pBlockAgg) {
×
761
    pDstBlock->pBlockAgg = taosMemoryCalloc(numOfCols, sizeof(SColumnDataAgg));
×
762
    if (pDstBlock->pBlockAgg == NULL) {
×
763
      blockDataDestroy(pDstBlock);
×
764
      return NULL;
×
765
    }
766
    for (int i = 0; i < numOfCols; ++i) {
×
767
      pDstBlock->pBlockAgg[i].colId = -1;
×
768
    }
769
  }
770

771
  for (int32_t i = 0; i < pOperator->exprSupp.numOfExprs; ++i) {
×
772
    SExprInfo*       pExpr = &pOperator->exprSupp.pExprInfo[i];
×
773
    int32_t          slotId = pExpr->base.pParam[0].pCol->slotId;
×
774
    SColumnInfoData* pSrc = taosArrayGet(pDataBlock->pDataBlock, slotId);
×
775
    SColumnInfoData  colInfo = {.hasNull = true, .info = pSrc->info};
×
776
    code = blockDataAppendColInfo(pDstBlock, &colInfo);
×
777
    QUERY_CHECK_CODE(code, lino, _end);
×
778

779
    SColumnInfoData* pDst = taosArrayGet(pDstBlock->pDataBlock, i);
×
780
    if (pDataBlock->pBlockAgg && pDataBlock->pBlockAgg[slotId].colId != -1) {
×
781
      pDstBlock->pBlockAgg[i] = pDataBlock->pBlockAgg[slotId];
×
782
    } else {
783
      code = doEnsureCapacity(pDst, &pDstBlock->info, pDataBlock->info.rows, false);
×
784
      QUERY_CHECK_CODE(code, lino, _end);
×
785

786
      code = colDataAssign(pDst, pSrc, pDataBlock->info.rows, &pDataBlock->info);
×
787
      QUERY_CHECK_CODE(code, lino, _end);
×
788
    }
789
  }
790

791
_end:
×
792
  if (code != TSDB_CODE_SUCCESS) {
×
793
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
794
    blockDataDestroy(pDstBlock);
×
795
    return NULL;
×
796
  }
797
  return pDstBlock;
×
798
}
799

800
static void doHashPartition(SOperatorInfo* pOperator, SSDataBlock* pBlock) {
20,520,147✔
801
  int32_t                 code = TSDB_CODE_SUCCESS;
20,520,147✔
802
  int32_t                 lino = 0;
20,520,147✔
803
  SPartitionOperatorInfo* pInfo = pOperator->info;
20,520,147✔
804
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
20,519,590✔
805

806
  for (int32_t j = 0; j < pBlock->info.rows; ++j) {
2,147,483,647✔
807
    recordNewGroupKeys(pInfo->pGroupCols, pInfo->pGroupColVals, pBlock, j);
2,147,483,647✔
808
    int32_t len = buildGroupKeys(pInfo->keyBuf, pInfo->pGroupColVals);
2,147,483,647✔
809

810
    SDataGroupInfo* pGroupInfo = NULL;
2,147,483,647✔
811
    void*           pPage = getCurrentDataGroupInfo(pInfo, &pGroupInfo, len);
2,147,483,647✔
812
    if (pPage == NULL) {
2,147,483,647✔
813
      T_LONG_JMP(pTaskInfo->env, terrno);
×
814
    }
815

816
    pGroupInfo->numOfRows += 1;
2,147,483,647✔
817

818
    // group id
819
    if (pGroupInfo->groupId == 0) {
2,147,483,647✔
820
      pGroupInfo->groupId = calcGroupId(pInfo->keyBuf, len);
75,459,935✔
821
    }
822

823
    if (pBlock->info.dataLoad) {
2,147,483,647✔
824
      // number of rows
825
      int32_t* rows = (int32_t*)pPage;
2,147,483,647✔
826

827
      size_t numOfCols = pOperator->exprSupp.numOfExprs;
2,147,483,647✔
828
      for (int32_t i = 0; i < numOfCols; ++i) {
2,147,483,647✔
829
        SExprInfo* pExpr = &pOperator->exprSupp.pExprInfo[i];
2,147,483,647✔
830
        int32_t    slotId = pExpr->base.pParam[0].pCol->slotId;
2,147,483,647✔
831
        SColumnInfoData* pSrcColInfoData = taosArrayGet(pBlock->pDataBlock, slotId);
2,147,483,647✔
832
        SColumnInfoData* pDstColInfoData = taosArrayGet(pInfo->binfo.pRes->pDataBlock, i);
2,147,483,647✔
833
        QUERY_CHECK_NULL(pSrcColInfoData, code, lino, _end, terrno);
2,147,483,647✔
834
        QUERY_CHECK_NULL(pDstColInfoData, code, lino, _end, terrno);
2,147,483,647✔
835

836
        int32_t bytes = pDstColInfoData->info.bytes;
2,147,483,647✔
837
        int32_t startOffset = pInfo->columnOffset[i];
2,147,483,647✔
838
        int32_t reservedBytes = blockDataGetPagedColumnReservedBytes(pDstColInfoData);
2,147,483,647✔
839

840
        int32_t* columnLen = NULL;
2,147,483,647✔
841
        int32_t  contentLen = 0;
2,147,483,647✔
842

843
        if (IS_VAR_DATA_TYPE(pDstColInfoData->info.type)) {
2,147,483,647✔
844
          int32_t* offset = (int32_t*)((char*)pPage + startOffset);
2,147,483,647✔
845
          columnLen = (int32_t*)((char*)pPage + startOffset + sizeof(int32_t) * pInfo->rowCapacity);
2,147,483,647✔
846
          char* data = (char*)((char*)columnLen + sizeof(int32_t));
2,147,483,647✔
847

848
          if (colDataIsNull_s(pSrcColInfoData, j)) {
2,147,483,647✔
849
            offset[(*rows)] = -1;
2,147,483,647✔
850
            contentLen = 0;
2,147,483,647✔
851
          } else if (pSrcColInfoData->info.type == TSDB_DATA_TYPE_JSON) {
2,147,483,647✔
852
            offset[*rows] = (*columnLen);
25,424✔
853
            char*   src = colDataGetData(pSrcColInfoData, j);
25,424✔
854
            int32_t dataLen = getJsonValueLen(src);
25,017✔
855

856
            memcpy(data + (*columnLen), src, dataLen);
25,824✔
857
            int32_t v = (data + (*columnLen) + dataLen - (char*)pPage);
25,824✔
858
            QUERY_CHECK_CONDITION((v > 0), code, lino, _end, TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
25,824✔
859

860
            contentLen = dataLen;
25,824✔
861
          } else {
862
            if (IS_STR_DATA_BLOB(pSrcColInfoData->info.type)) {
2,147,483,647✔
863
              offset[*rows] = (*columnLen);
3,059,703✔
NEW
864
              char* src = colDataGetData(pSrcColInfoData, j);
×
865
              memcpy(data + (*columnLen), src, blobDataTLen(src));
×
866
              int32_t v = (data + (*columnLen) + blobDataTLen(src) - (char*)pPage);
×
867
              QUERY_CHECK_CONDITION((v > 0), code, lino, _end, TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
×
868

869
              contentLen = blobDataTLen(src);
×
870
            } else {
871
              offset[*rows] = (*columnLen);
2,147,483,647✔
872
              char* src = colDataGetData(pSrcColInfoData, j);
2,147,483,647✔
873
              memcpy(data + (*columnLen), src, varDataTLen(src));
2,147,483,647✔
874
              int32_t v = (data + (*columnLen) + varDataTLen(src) - (char*)pPage);
2,147,483,647✔
875
              QUERY_CHECK_CONDITION((v > 0), code, lino, _end, TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
2,147,483,647✔
876

877
              contentLen = varDataTLen(src);
2,147,483,647✔
878
            }
879
          }
880

881
          QUERY_CHECK_CONDITION((contentLen <= reservedBytes), code, lino, _end,
2,147,483,647✔
882
                                TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
883
          QUERY_CHECK_CONDITION(((*columnLen) + contentLen <= reservedBytes * pInfo->rowCapacity), code, lino, _end,
2,147,483,647✔
884
                                TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
885
        } else {
886
          char* bitmap = (char*)pPage + startOffset;
2,147,483,647✔
887
          columnLen = (int32_t*)((char*)pPage + startOffset + BitmapLen(pInfo->rowCapacity));
2,147,483,647✔
888
          char* data = (char*)columnLen + sizeof(int32_t);
2,147,483,647✔
889

890
          bool isNull = colDataIsNull_f(pSrcColInfoData, j);
2,147,483,647✔
891
          if (isNull) {
2,147,483,647✔
892
            colDataSetNull_f(bitmap, (*rows));
2,147,483,647✔
893
          } else {
894
            memcpy(data + (*columnLen), colDataGetData(pSrcColInfoData, j), bytes);
2,147,483,647✔
895
            QUERY_CHECK_CONDITION(((data + (*columnLen) + bytes - (char*)pPage) <= getBufPageSize(pInfo->pBuf)), code,
2,147,483,647✔
896
                                  lino, _end, TSDB_CODE_QRY_EXECUTOR_INTERNAL_ERROR);
897
          }
898
          contentLen = bytes;
2,147,483,647✔
899
        }
900

901
        (*columnLen) += contentLen;
2,147,483,647✔
902
      }
903

904
      (*rows) += 1;
2,147,483,647✔
905

906
      setBufPageDirty(pPage, true);
2,147,483,647✔
907
      releaseBufPage(pInfo->pBuf, pPage);
2,147,483,647✔
908
    } else {
909
      SSDataBlock* dataNotLoadBlock = createBlockDataNotLoaded(pOperator, pBlock);
×
910
      if (dataNotLoadBlock == NULL) {
×
911
        T_LONG_JMP(pTaskInfo->env, terrno);
×
912
      }
913
      if (pGroupInfo->blockForNotLoaded == NULL) {
×
914
        pGroupInfo->blockForNotLoaded = taosArrayInit(0, sizeof(SSDataBlock*));
×
915
        QUERY_CHECK_NULL(pGroupInfo->blockForNotLoaded, code, lino, _end, terrno);
×
916
        pGroupInfo->offsetForNotLoaded = 0;
×
917
      }
918
      dataNotLoadBlock->info.id.groupId = pGroupInfo->groupId;
×
919
      dataNotLoadBlock->info.dataLoad = 0;
×
920
      void* tmp = taosArrayPush(pGroupInfo->blockForNotLoaded, &dataNotLoadBlock);
×
921
      QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
×
922
      break;
×
923
    }
924
  }
925

926
_end:
21,968,255✔
927
  if (code != TSDB_CODE_SUCCESS) {
20,526,797✔
928
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
929
    T_LONG_JMP(pTaskInfo->env, code);
×
930
  }
931
}
20,526,797✔
932

933
void* getCurrentDataGroupInfo(const SPartitionOperatorInfo* pInfo, SDataGroupInfo** pGroupInfo, int32_t len) {
2,147,483,647✔
934
  int32_t         code = TSDB_CODE_SUCCESS;
2,147,483,647✔
935
  int32_t         lino = 0;
2,147,483,647✔
936
  SDataGroupInfo* p = taosHashGet(pInfo->pGroupSet, pInfo->keyBuf, len);
2,147,483,647✔
937

938
  void* pPage = NULL;
2,147,483,647✔
939
  if (p == NULL) {  // it is a new group
2,147,483,647✔
940
    SDataGroupInfo gi = {0};
75,455,205✔
941
    gi.pPageList = taosArrayInit(100, sizeof(int32_t));
75,455,205✔
942
    QUERY_CHECK_NULL(gi.pPageList, code, lino, _end, terrno);
75,450,204✔
943

944
    code = taosHashPut(pInfo->pGroupSet, pInfo->keyBuf, len, &gi, sizeof(SDataGroupInfo));
75,450,204✔
945
    if (code == TSDB_CODE_DUP_KEY) {
75,459,221✔
946
      code = TSDB_CODE_SUCCESS;
×
947
    }
948
    QUERY_CHECK_CODE(code, lino, _end);
75,459,221✔
949

950
    p = taosHashGet(pInfo->pGroupSet, pInfo->keyBuf, len);
75,459,221✔
951

952
    int32_t pageId = 0;
75,462,010✔
953
    pPage = getNewBufPage(pInfo->pBuf, &pageId);
75,462,010✔
954
    if (pPage == NULL) {
75,460,575✔
955
      return pPage;
×
956
    }
957

958
    void* tmp = taosArrayPush(p->pPageList, &pageId);
75,460,575✔
959
    QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
75,461,278✔
960

961
    *(int32_t*)pPage = 0;
75,461,278✔
962
  } else {
963
    int32_t* curId = taosArrayGetLast(p->pPageList);
2,147,483,647✔
964
    pPage = getBufPage(pInfo->pBuf, *curId);
2,147,483,647✔
965
    if (pPage == NULL) {
2,147,483,647✔
966
      qError("failed to get buffer, code:%s", tstrerror(terrno));
×
967
      return pPage;
×
968
    }
969

970
    int32_t* rows = (int32_t*)pPage;
2,147,483,647✔
971
    if (*rows >= pInfo->rowCapacity) {
2,147,483,647✔
972
      // release buffer
973
      releaseBufPage(pInfo->pBuf, pPage);
269,240,522✔
974

975
      // add a new page for current group
976
      int32_t pageId = 0;
269,236,691✔
977
      pPage = getNewBufPage(pInfo->pBuf, &pageId);
269,237,166✔
978
      if (pPage == NULL) {
269,235,297✔
979
        qError("failed to get new buffer, code:%s", tstrerror(terrno));
×
980
        return NULL;
×
981
      }
982

983
      void* tmp = taosArrayPush(p->pPageList, &pageId);
269,235,297✔
984
      QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
269,241,947✔
985

986
      memset(pPage, 0, getBufPageSize(pInfo->pBuf));
269,241,947✔
987
    }
988
  }
989

990
  *pGroupInfo = p;
2,147,483,647✔
991

992
_end:
2,147,483,647✔
993
  if (code != TSDB_CODE_SUCCESS) {
2,147,483,647✔
994
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
995
    return NULL;
×
996
  }
997

998
  return pPage;
2,147,483,647✔
999
}
1000

1001
int32_t* setupColumnOffset(const SSDataBlock* pBlock, int32_t rowCapacity) {
3,004,588✔
1002
  size_t   numOfCols = taosArrayGetSize(pBlock->pDataBlock);
3,004,588✔
1003
  int32_t* offset = taosMemoryCalloc(numOfCols, sizeof(int32_t));
3,004,195✔
1004
  if (!offset) {
3,001,874✔
1005
    return NULL;
×
1006
  }
1007

1008
  offset[0] = sizeof(int32_t) +
3,001,874✔
1009
              sizeof(uint64_t);  // the number of rows in current page, ref to SSDataBlock paged serialization format
1010

1011
  for (int32_t i = 0; i < numOfCols - 1; ++i) {
9,594,346✔
1012
    SColumnInfoData* pColInfoData = taosArrayGet(pBlock->pDataBlock, i);
6,591,660✔
1013

1014
    int32_t payloadLen = blockDataGetPagedColumnReservedBytes(pColInfoData) * rowCapacity;
6,588,300✔
1015

1016
    if (IS_VAR_DATA_TYPE(pColInfoData->info.type)) {
6,588,701✔
1017
      // offset segment + content length + payload
1018
      offset[i + 1] = rowCapacity * sizeof(int32_t) + sizeof(int32_t) + payloadLen + offset[i];
1,247,717✔
1019
    } else {
1020
      // bitmap + content length + payload
1021
      offset[i + 1] = BitmapLen(rowCapacity) + sizeof(int32_t) + payloadLen + offset[i];
5,339,153✔
1022
    }
1023
  }
1024

1025
  return offset;
3,002,686✔
1026
}
1027

1028
static void clearPartitionOperator(SPartitionOperatorInfo* pInfo) {
2,882,197✔
1029
  int32_t size = taosArrayGetSize(pInfo->sortedGroupArray);
2,882,197✔
1030
  for (int32_t i = 0; i < size; i++) {
45,462,308✔
1031
    SDataGroupInfo* pGp = taosArrayGet(pInfo->sortedGroupArray, i);
42,580,519✔
1032
    if (pGp && pGp->blockForNotLoaded) {
42,580,125✔
1033
      for (int32_t i = 0; i < pGp->blockForNotLoaded->size; i++) {
×
1034
        SSDataBlock** pBlock = taosArrayGet(pGp->blockForNotLoaded, i);
×
1035
        if (pBlock) blockDataDestroy(*pBlock);
×
1036
      }
1037
      taosArrayClear(pGp->blockForNotLoaded);
×
1038
      pGp->offsetForNotLoaded = 0;
×
1039
    }
1040
    taosArrayDestroy(pGp->pPageList);
42,580,919✔
1041
  }
1042
  taosArrayClear(pInfo->sortedGroupArray);
2,881,789✔
1043
  clearDiskbasedBuf(pInfo->pBuf);
2,880,982✔
1044
}
2,881,390✔
1045

1046
static int compareDataGroupInfo(const void* group1, const void* group2) {
694,043,342✔
1047
  const SDataGroupInfo* pGroupInfo1 = group1;
694,043,342✔
1048
  const SDataGroupInfo* pGroupInfo2 = group2;
694,043,342✔
1049

1050
  if (pGroupInfo1->groupId == pGroupInfo2->groupId) {
694,043,342✔
1051
    return 0;
×
1052
  }
1053

1054
  return (pGroupInfo1->groupId < pGroupInfo2->groupId) ? -1 : 1;
694,044,549✔
1055
}
1056

1057
static SSDataBlock* buildPartitionResultForNotLoadBlock(SDataGroupInfo* pGroupInfo) {
43,294,915✔
1058
  if (pGroupInfo->blockForNotLoaded && pGroupInfo->offsetForNotLoaded < pGroupInfo->blockForNotLoaded->size) {
43,294,915✔
1059
    SSDataBlock** pBlock = taosArrayGet(pGroupInfo->blockForNotLoaded, pGroupInfo->offsetForNotLoaded);
×
1060
    if (!pBlock) {
×
1061
      return NULL;
×
1062
    }
1063
    pGroupInfo->offsetForNotLoaded++;
×
1064
    return *pBlock;
×
1065
  }
1066
  return NULL;
43,294,915✔
1067
}
1068

1069
static SSDataBlock* buildPartitionResult(SOperatorInfo* pOperator) {
317,755,178✔
1070
  int32_t                 code = TSDB_CODE_SUCCESS;
317,755,178✔
1071
  int32_t                 lino = 0;
317,755,178✔
1072
  SPartitionOperatorInfo* pInfo = pOperator->info;
317,755,178✔
1073
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
317,755,277✔
1074

1075
  if (pInfo->remainRows == 0) {
317,754,395✔
1076
    blockDataCleanup(pInfo->binfo.pRes);
292,027,681✔
1077
    SDataGroupInfo* pGroupInfo =
292,028,525✔
1078
        (pInfo->groupIndex != -1) ? taosArrayGet(pInfo->sortedGroupArray, pInfo->groupIndex) : NULL;
292,030,388✔
1079
    if (pInfo->groupIndex == -1 || pInfo->pageIndex >= taosArrayGetSize(pGroupInfo->pPageList)) {
292,028,525✔
1080
      if (pGroupInfo != NULL) {
46,280,971✔
1081
        SSDataBlock* ret = buildPartitionResultForNotLoadBlock(pGroupInfo);
43,296,129✔
1082
        if (ret != NULL) return ret;
43,294,915✔
1083
      }
1084
      // try next group data
1085
      if (pInfo->groupIndex + 1 >= taosArrayGetSize(pInfo->sortedGroupArray)) {
46,279,757✔
1086
        setOperatorCompleted(pOperator);
2,882,597✔
1087
        clearPartitionOperator(pInfo);
2,883,011✔
1088
        return NULL;
2,881,390✔
1089
      }
1090
      ++pInfo->groupIndex;
43,398,500✔
1091

1092
      pGroupInfo = taosArrayGet(pInfo->sortedGroupArray, pInfo->groupIndex);
43,398,500✔
1093
      if (pGroupInfo == NULL) {
43,397,686✔
1094
        qError("failed to get buffer, code:%s, %s", tstrerror(terrno), GET_TASKID(pTaskInfo));
×
1095
        T_LONG_JMP(pTaskInfo->env, terrno);
×
1096
      }
1097
      pInfo->pageIndex = 0;
43,397,686✔
1098
    }
1099

1100
    int32_t* pageId = taosArrayGet(pGroupInfo->pPageList, pInfo->pageIndex);
289,146,703✔
1101
    if (pageId == NULL) {
289,145,688✔
1102
      qError("failed to get buffer, code:%s, %s", tstrerror(terrno), GET_TASKID(pTaskInfo));
×
1103
      T_LONG_JMP(pTaskInfo->env, terrno);
×
1104
    }
1105
    void* page = getBufPage(pInfo->pBuf, *pageId);
289,145,688✔
1106
    if (page == NULL) {
289,144,263✔
1107
      qError("failed to get buffer, code:%s, %s", tstrerror(terrno), GET_TASKID(pTaskInfo));
×
1108
      T_LONG_JMP(pTaskInfo->env, terrno);
×
1109
    }
1110
    if (*(int32_t*)page == 0) {
289,144,263✔
1111
      releaseBufPage(pInfo->pBuf, page);
×
1112
      SSDataBlock* ret = buildPartitionResultForNotLoadBlock(pGroupInfo);
×
1113
      if (ret != NULL) return ret;
×
1114
      if (pInfo->groupIndex + 1 < taosArrayGetSize(pInfo->sortedGroupArray)) {
×
1115
        pInfo->groupIndex++;
×
1116
        pInfo->pageIndex = 0;
×
1117
      } else {
1118
        setOperatorCompleted(pOperator);
×
1119
        clearPartitionOperator(pInfo);
×
1120
        return NULL;
×
1121
      }
1122
      return buildPartitionResult(pOperator);
×
1123
    }
1124

1125
    code = blockDataEnsureCapacity(pInfo->binfo.pRes, pInfo->rowCapacity);
289,144,263✔
1126
    QUERY_CHECK_CODE(code, lino, _end);
289,145,688✔
1127

1128
    code = blockDataFromBuf1(pInfo->binfo.pRes, page, pInfo->rowCapacity);
289,145,688✔
1129
    QUERY_CHECK_CODE(code, lino, _end);
289,145,996✔
1130

1131
    pInfo->pageIndex += 1;
289,145,996✔
1132
    releaseBufPage(pInfo->pBuf, page);
289,145,182✔
1133
    pInfo->binfo.pRes->info.id.groupId = pGroupInfo->groupId;
289,143,695✔
1134
    pInfo->binfo.pRes->info.dataLoad = 1;
289,144,984✔
1135
    pInfo->orderedRows = 0;
289,143,763✔
1136
  } else if (pInfo->pOrderInfoArr == NULL) {
25,729,761✔
1137
    qError("Exception, remainRows not zero, but pOrderInfoArr is NULL");
×
1138
  }
1139

1140
  if (pInfo->pOrderInfoArr) {
314,873,531✔
1141
    pInfo->binfo.pRes->info.rows += pInfo->remainRows;
76,945,569✔
1142
    code = blockDataTrimFirstRows(pInfo->binfo.pRes, pInfo->orderedRows);
76,946,044✔
1143
    QUERY_CHECK_CODE(code, lino, _end);
76,944,619✔
1144
    pInfo->orderedRows = blockDataGetSortedRows(pInfo->binfo.pRes, pInfo->pOrderInfoArr);
76,944,619✔
1145
    pInfo->remainRows = pInfo->binfo.pRes->info.rows - pInfo->orderedRows;
76,946,519✔
1146
    pInfo->binfo.pRes->info.rows = pInfo->orderedRows;
76,946,994✔
1147
  }
1148

1149
  code = blockDataUpdateTsWindow(pInfo->binfo.pRes, 0);
314,873,931✔
1150
  QUERY_CHECK_CODE(code, lino, _end);
314,871,717✔
1151

1152
_end:
314,871,717✔
1153
  if (code != TSDB_CODE_SUCCESS) {
314,871,717✔
1154
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
1155
    T_LONG_JMP(pTaskInfo->env, code);
×
1156
  }
1157

1158
  return pInfo->binfo.pRes;
314,871,717✔
1159
}
1160

1161
static int32_t hashPartitionNext(SOperatorInfo* pOperator, SSDataBlock** ppRes) {
317,786,113✔
1162
  if (pOperator->status == OP_EXEC_DONE) {
317,786,113✔
1163
    (*ppRes) = NULL;
12,843✔
1164
    return TSDB_CODE_SUCCESS;
12,843✔
1165
  }
1166

1167
  int32_t                 code = TSDB_CODE_SUCCESS;
317,770,959✔
1168
  int32_t                 lino = 0;
317,770,959✔
1169
  SExecTaskInfo*          pTaskInfo = pOperator->pTaskInfo;
317,770,959✔
1170
  SPartitionOperatorInfo* pInfo = pOperator->info;
317,772,224✔
1171
  SSDataBlock*            pRes = pInfo->binfo.pRes;
317,770,205✔
1172

1173
  if (pOperator->status == OP_RES_TO_RETURN) {
317,775,427✔
1174
    (*ppRes) = buildPartitionResult(pOperator);
314,771,463✔
1175
    return code;
314,773,146✔
1176
  }
1177

1178
  while (1) {
20,525,990✔
1179
    SSDataBlock* pBlock = getNextBlockFromDownstream(pOperator, 0);
23,532,040✔
1180
    if (pBlock == NULL) {
23,500,643✔
1181
      break;
2,985,789✔
1182
    }
1183

1184
    pInfo->binfo.pRes->info.scanFlag = pBlock->info.scanFlag;
20,514,854✔
1185
    // there is an scalar expression that needs to be calculated right before apply the group aggregation.
1186
    if (pInfo->scalarSup.pExprInfo != NULL) {
20,525,963✔
1187
      code =
1188
          projectApplyFunctions(pInfo->scalarSup.pExprInfo, pBlock, pBlock, pInfo->scalarSup.pCtx,
105,254✔
1189
                                pInfo->scalarSup.numOfExprs, NULL, GET_STM_RTINFO(pOperator->pTaskInfo));
105,254✔
1190
      QUERY_CHECK_CODE(code, lino, _end);
105,254✔
1191
    }
1192

1193
    terrno = TSDB_CODE_SUCCESS;
20,524,422✔
1194
    doHashPartition(pOperator, pBlock);
20,523,472✔
1195
    if (terrno != TSDB_CODE_SUCCESS) {  // group by json error
20,525,379✔
1196
      code = terrno;
×
1197
      QUERY_CHECK_CODE(code, lino, _end);
68✔
1198
    }
1199
  }
1200

1201
  SArray* groupArray = taosArrayInit(taosHashGetSize(pInfo->pGroupSet), sizeof(SDataGroupInfo));
2,985,789✔
1202
  QUERY_CHECK_NULL(groupArray, code, lino, _end, terrno);
2,985,375✔
1203

1204
  void* pGroupIter = taosHashIterate(pInfo->pGroupSet, NULL);
2,985,375✔
1205
  while (pGroupIter != NULL) {
78,448,349✔
1206
    SDataGroupInfo* pGroupInfo = pGroupIter;
75,461,753✔
1207
    void*           tmp = taosArrayPush(groupArray, pGroupInfo);
75,462,960✔
1208
    QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
75,462,960✔
1209
    pGroupIter = taosHashIterate(pInfo->pGroupSet, pGroupIter);
75,462,960✔
1210
  }
1211

1212
  taosArraySort(groupArray, compareDataGroupInfo);
2,986,596✔
1213
  pInfo->sortedGroupArray = groupArray;
2,985,389✔
1214
  pInfo->groupIndex = -1;
2,985,796✔
1215
  taosHashClear(pInfo->pGroupSet);
2,985,389✔
1216

1217
  pOperator->status = OP_RES_TO_RETURN;
2,985,389✔
1218
  code = blockDataEnsureCapacity(pRes, 4096);
2,985,389✔
1219
  QUERY_CHECK_CODE(code, lino, _end);
2,986,596✔
1220

1221
_end:
2,986,596✔
1222
  if (code != TSDB_CODE_SUCCESS) {
2,986,596✔
1223
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
1224
    pTaskInfo->code = code;
×
1225
    T_LONG_JMP(pTaskInfo->env, code);
×
1226
  }
1227

1228
  (*ppRes) = buildPartitionResult(pOperator);
2,986,596✔
1229
  return code;
2,986,596✔
1230
}
1231

1232
static void destroyPartitionOperatorInfo(void* param) {
3,025,395✔
1233
  SPartitionOperatorInfo* pInfo = (SPartitionOperatorInfo*)param;
3,025,395✔
1234
  cleanupBasicInfo(&pInfo->binfo);
3,025,395✔
1235
  taosArrayDestroy(pInfo->pGroupCols);
3,025,796✔
1236

1237
  for (int i = 0; i < taosArrayGetSize(pInfo->pGroupColVals); i++) {
6,848,045✔
1238
    SGroupKeys key = *(SGroupKeys*)taosArrayGet(pInfo->pGroupColVals, i);
3,823,470✔
1239
    taosMemoryFree(key.pData);
3,823,470✔
1240
  }
1241

1242
  taosArrayDestroy(pInfo->pGroupColVals);
3,024,181✔
1243
  taosMemoryFree(pInfo->keyBuf);
3,023,379✔
1244

1245
  int32_t size = taosArrayGetSize(pInfo->sortedGroupArray);
3,023,373✔
1246
  for (int32_t i = 0; i < size; i++) {
35,907,430✔
1247
    SDataGroupInfo* pGp = taosArrayGet(pInfo->sortedGroupArray, i);
32,881,634✔
1248
    if (pGp) {
32,881,634✔
1249
      taosArrayDestroy(pGp->pPageList);
32,881,634✔
1250
    }
1251
  }
1252
  taosArrayDestroy(pInfo->sortedGroupArray);
3,025,796✔
1253

1254
  void* pGroupIter = taosHashIterate(pInfo->pGroupSet, NULL);
3,022,820✔
1255
  while (pGroupIter != NULL) {
3,025,796✔
1256
    SDataGroupInfo* pGroupInfo = pGroupIter;
×
1257
    taosArrayDestroy(pGroupInfo->pPageList);
×
1258
    pGroupIter = taosHashIterate(pInfo->pGroupSet, pGroupIter);
×
1259
  }
1260

1261
  taosHashCleanup(pInfo->pGroupSet);
3,025,796✔
1262
  taosMemoryFree(pInfo->columnOffset);
3,023,633✔
1263

1264
  cleanupExprSupp(&pInfo->scalarSup);
3,024,589✔
1265
  destroyDiskbasedBuf(pInfo->pBuf);
3,024,988✔
1266
  taosArrayDestroy(pInfo->pOrderInfoArr);
3,023,228✔
1267
  taosMemoryFreeClear(param);
3,022,414✔
1268
}
3,024,829✔
1269

1270
static int32_t resetPartitionOperState(SOperatorInfo* pOper) {
×
1271
  SPartitionOperatorInfo* pInfo = pOper->info;
×
1272
  SExecTaskInfo*           pTaskInfo = pOper->pTaskInfo;
×
1273
  SPartitionPhysiNode* pPhynode = (SPartitionPhysiNode*)pOper->pPhyNode;
×
1274
  resetBasicOperatorState(&pInfo->binfo);
×
1275

1276
  int32_t code = resetExprSupp(&pInfo->scalarSup, pTaskInfo, pPhynode->pExprs, NULL,
×
1277
    &pTaskInfo->storageAPI.functionStore);
1278

1279
  clearPartitionOperator(pInfo);
×
1280

1281
  void* pGroupIter = taosHashIterate(pInfo->pGroupSet, NULL);
×
1282
  while (pGroupIter != NULL) {
×
1283
    SDataGroupInfo* pGroupInfo = pGroupIter;
×
1284
    taosArrayDestroy(pGroupInfo->pPageList);
×
1285
    pGroupIter = taosHashIterate(pInfo->pGroupSet, pGroupIter);
×
1286
  }
1287
  taosHashClear(pInfo->pGroupSet);
×
1288

1289
  int32_t size = taosArrayGetSize(pInfo->sortedGroupArray);
×
1290
  for (int32_t i = 0; i < size; i++) {
×
1291
    SDataGroupInfo* pGp = taosArrayGet(pInfo->sortedGroupArray, i);
×
1292
    if (pGp) {
×
1293
      taosArrayDestroy(pGp->pPageList);
×
1294
    }
1295
  }
1296
  taosArrayDestroy(pInfo->sortedGroupArray);
×
1297
  pInfo->sortedGroupArray = NULL;
×
1298

1299
  pInfo->groupIndex = 0;
×
1300
  pInfo->pageIndex = 0;
×
1301
  pInfo->remainRows = 0;
×
1302
  pInfo->orderedRows = 0;
×
1303
  return 0;
×
1304
}
1305

1306
int32_t createPartitionOperatorInfo(SOperatorInfo* downstream, SPartitionPhysiNode* pPartNode,
3,024,988✔
1307
                                           SExecTaskInfo* pTaskInfo, SOperatorInfo** pOptrInfo) {
1308
  QRY_PARAM_CHECK(pOptrInfo);
3,024,988✔
1309

1310
  int32_t                 code = TSDB_CODE_SUCCESS;
3,025,389✔
1311
  int32_t                 lino = 0;
3,025,389✔
1312
  SPartitionOperatorInfo* pInfo = taosMemoryCalloc(1, sizeof(SPartitionOperatorInfo));
3,025,389✔
1313
  SOperatorInfo*          pOperator = taosMemoryCalloc(1, sizeof(SOperatorInfo));
3,019,019✔
1314
  if (pInfo == NULL || pOperator == NULL) {
3,023,621✔
1315
    pTaskInfo->code = code = terrno;
147✔
1316
    goto _error;
×
1317
  }
1318
  initOperatorCostInfo(pOperator);
3,023,474✔
1319

1320
  pOperator->pPhyNode = pPartNode;
3,024,181✔
1321
  int32_t    numOfCols = 0;
3,024,181✔
1322
  SExprInfo* pExprInfo = NULL;
3,024,989✔
1323
  code = createExprInfo(pPartNode->pTargets, NULL, &pExprInfo, &numOfCols);
3,023,361✔
1324
  QUERY_CHECK_CODE(code, lino, _error);
3,025,389✔
1325
  pOperator->exprSupp.numOfExprs = numOfCols;
3,025,389✔
1326
  pOperator->exprSupp.pExprInfo = pExprInfo;
3,025,389✔
1327

1328
  pInfo->pGroupCols = makeColumnArrayFromList(pPartNode->pPartitionKeys);
3,023,315✔
1329

1330
  if (pPartNode->needBlockOutputTsOrder) {
3,020,640✔
1331
    SBlockOrderInfo order = {.order = ORDER_ASC, .pColData = NULL, .nullFirst = false, .slotId = pPartNode->tsSlotId};
270,764✔
1332
    pInfo->pOrderInfoArr = taosArrayInit(1, sizeof(SBlockOrderInfo));
270,764✔
1333
    if (!pInfo->pOrderInfoArr) {
270,751✔
1334
      pTaskInfo->code = terrno;
×
1335
      goto _error;
×
1336
    }
1337

1338
    void* tmp = taosArrayPush(pInfo->pOrderInfoArr, &order);
271,311✔
1339
    QUERY_CHECK_NULL(tmp, code, lino, _error, terrno);
271,311✔
1340
  }
1341

1342
  if (pPartNode->pExprs != NULL) {
3,021,854✔
1343
    int32_t    num = 0;
84,238✔
1344
    SExprInfo* pExprInfo1 = NULL;
84,238✔
1345
    code = createExprInfo(pPartNode->pExprs, NULL, &pExprInfo1, &num);
84,238✔
1346
    QUERY_CHECK_CODE(code, lino, _error);
83,827✔
1347

1348
    code = initExprSupp(&pInfo->scalarSup, pExprInfo1, num, &pTaskInfo->storageAPI.functionStore);
64,227✔
1349
    QUERY_CHECK_CODE(code, lino, _error);
64,638✔
1350
  }
1351

1352
  _hash_fn_t hashFn = taosGetDefaultHashFunction(TSDB_DATA_TYPE_BINARY);
3,004,981✔
1353
  pInfo->pGroupSet = taosHashInit(100, hashFn, false, HASH_NO_LOCK);
3,004,988✔
1354
  if (pInfo->pGroupSet == NULL) {
3,006,196✔
1355
    goto _error;
×
1356
  }
1357

1358
  uint32_t defaultPgsz = 0;
3,005,796✔
1359
  int64_t  defaultBufsz = 0;
3,006,196✔
1360

1361
  pInfo->binfo.pRes = createDataBlockFromDescNode(pPartNode->node.pOutputDataBlockDesc);
3,006,196✔
1362
  QUERY_CHECK_NULL(pInfo->binfo.pRes, code, lino, _error, terrno);
3,005,789✔
1363
  code = getBufferPgSize(pInfo->binfo.pRes->info.rowSize, &defaultPgsz, &defaultBufsz);
3,003,374✔
1364
  if (code != TSDB_CODE_SUCCESS) {
3,004,989✔
1365
    goto _error;
×
1366
  }
1367

1368
  if (!osTempSpaceAvailable()) {
3,004,989✔
1369
    terrno = TSDB_CODE_NO_DISKSPACE;
×
1370
    qError("Create partition operator info failed since %s, tempDir:%s", terrstr(), tsTempDir);
×
1371
    goto _error;
×
1372
  }
1373

1374
  code = createDiskbasedBuf(&pInfo->pBuf, defaultPgsz, defaultBufsz, pTaskInfo->id.str, tsTempDir);
3,004,581✔
1375
  if (code != TSDB_CODE_SUCCESS) {
3,004,574✔
1376
    goto _error;
×
1377
  }
1378

1379
  pInfo->rowCapacity =
3,001,861✔
1380
      getPartitionPageRowCapacity(pInfo->binfo.pRes, getBufPageSize(pInfo->pBuf),
3,002,140✔
1381
                                  blockDataGetSerialMetaSize(taosArrayGetSize(pInfo->binfo.pRes->pDataBlock)));
3,004,574✔
1382
  if (pInfo->rowCapacity < 0) {
3,002,828✔
1383
    code = terrno;
×
1384
    goto _error;
×
1385
  }
1386

1387
  pInfo->columnOffset = setupColumnOffset(pInfo->binfo.pRes, pInfo->rowCapacity);
3,001,473✔
1388
  QUERY_CHECK_NULL(pInfo->columnOffset, code, lino, _error, terrno);
3,003,888✔
1389

1390
  code = initGroupOptrInfo(&pInfo->pGroupColVals, &pInfo->groupKeyLen, &pInfo->keyBuf, pInfo->pGroupCols);
2,996,464✔
1391
  if (code != TSDB_CODE_SUCCESS) {
3,001,046✔
1392
    goto _error;
×
1393
  }
1394

1395
  setOperatorInfo(pOperator, "PartitionOperator", QUERY_NODE_PHYSICAL_PLAN_PARTITION, false, OP_NOT_OPENED, pInfo,
3,001,046✔
1396
                  pTaskInfo);
1397

1398
  pOperator->fpSet = createOperatorFpSet(optrDummyOpenFn, hashPartitionNext, NULL, destroyPartitionOperatorInfo,
3,003,787✔
1399
                                         optrDefaultBufFn, NULL, optrDefaultGetNextExtFn, NULL);
1400

1401
  setOperatorResetStateFn(pOperator, resetPartitionOperState);
3,002,414✔
1402
  code = appendDownstream(pOperator, &downstream, 1);
2,997,699✔
1403
  if (code != TSDB_CODE_SUCCESS) {
3,004,588✔
1404
    goto _error;
×
1405
  }
1406

1407
  *pOptrInfo = pOperator;
3,004,588✔
1408
  return TSDB_CODE_SUCCESS;
3,004,988✔
1409

1410
_error:
19,600✔
1411
  if (pInfo != NULL) {
19,600✔
1412
    destroyPartitionOperatorInfo(pInfo);
19,600✔
1413
  }
1414
  pTaskInfo->code = code;
19,600✔
1415
  destroyOperatorAndDownstreams(pOperator, &downstream, 1);
19,600✔
1416
  TAOS_RETURN(code);
19,600✔
1417
}
1418

1419
int32_t setGroupResultOutputBuf(SOperatorInfo* pOperator, SOptrBasicInfo* binfo, int32_t numOfCols, char* pData,
2,147,483,647✔
1420
                                int32_t bytes, uint64_t groupId, SDiskbasedBuf* pBuf, SAggSupporter* pAggSup) {
1421
  SExecTaskInfo*  pTaskInfo = pOperator->pTaskInfo;
2,147,483,647✔
1422
  SResultRowInfo* pResultRowInfo = &binfo->resultRowInfo;
2,147,483,647✔
1423
  SqlFunctionCtx* pCtx = pOperator->exprSupp.pCtx;
2,147,483,647✔
1424

1425
  SResultRow* pResultRow = doSetResultOutBufByKey(pBuf, pResultRowInfo, (char*)pData, bytes, true, groupId, pTaskInfo,
2,147,483,647✔
1426
                                                  false, pAggSup, false);
1427
  if (pResultRow == NULL || pTaskInfo->code != 0) {
2,147,483,647✔
1428
    return pTaskInfo->code;
248,853✔
1429
  }
1430

1431
  return setResultRowInitCtx(pResultRow, pCtx, numOfCols, pOperator->exprSupp.rowEntryInfoOffset);
2,147,483,647✔
1432
}
1433

1434
void freePartItem(void* ptr) {
×
1435
  SPartitionDataInfo* pPart = (SPartitionDataInfo*)ptr;
×
1436
  taosArrayDestroy(pPart->rowIds);
×
1437
}
×
1438

1439
int32_t extractColumnInfo(SNodeList* pNodeList, SArray** pArrayRes) {
31,567,536✔
1440
  int32_t code = TSDB_CODE_SUCCESS;
31,567,536✔
1441
  int32_t lino = 0;
31,567,536✔
1442
  size_t  numOfCols = LIST_LENGTH(pNodeList);
31,567,536✔
1443
  SArray* pList = taosArrayInit(numOfCols, sizeof(SColumn));
31,570,665✔
1444
  if (pList == NULL) {
31,565,292✔
1445
    code = terrno;
×
1446
    (*pArrayRes) = NULL;
×
UNCOV
1447
    QUERY_CHECK_CODE(code, lino, _end);
×
1448
  }
1449

1450
  for (int32_t i = 0; i < numOfCols; ++i) {
80,410,997✔
1451
    STargetNode* pNode = (STargetNode*)nodesListGetNode(pNodeList, i);
48,851,755✔
1452
    QUERY_CHECK_NULL(pNode, code, lino, _end, terrno);
48,842,128✔
1453

1454
    if (nodeType(pNode->pExpr) == QUERY_NODE_COLUMN) {
48,842,128✔
1455
      SColumnNode* pColNode = (SColumnNode*)pNode->pExpr;
48,849,043✔
1456

1457
      SColumn c = extractColumnFromColumnNode(pColNode);
48,850,026✔
1458
      void*   tmp = taosArrayPush(pList, &c);
48,854,280✔
1459
      QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
48,854,280✔
1460
    } else if (nodeType(pNode->pExpr) == QUERY_NODE_VALUE) {
×
1461
      SValueNode* pValNode = (SValueNode*)pNode->pExpr;
×
1462
      SColumn     c = {0};
×
1463
      c.slotId = pNode->slotId;
×
1464
      c.colId = pNode->slotId;
×
1465
      c.type = pValNode->node.type;
×
1466
      c.bytes = pValNode->node.resType.bytes;
×
1467
      c.scale = pValNode->node.resType.scale;
×
1468
      c.precision = pValNode->node.resType.precision;
×
1469

1470
      void* tmp = taosArrayPush(pList, &c);
×
1471
      QUERY_CHECK_NULL(tmp, code, lino, _end, terrno);
×
1472
    }
1473
  }
1474

1475
  (*pArrayRes) = pList;
31,559,242✔
1476

1477
_end:
31,574,672✔
1478
  if (code != TSDB_CODE_SUCCESS) {
31,574,672✔
1479
    qError("%s failed at line %d since %s", __func__, lino, tstrerror(code));
×
1480
  }
1481
  return code;
31,565,579✔
1482
}
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2026 Coveralls, Inc