• Home
  • Features
  • Pricing
  • Docs
  • Announcements
  • Sign In

georgia-tech-db / eva / #758

04 Sep 2023 08:37PM UTC coverage: 0.0% (-78.3%) from 78.333%
#758

push

circle-ci

hershd23
Increased underline length at line 75 in text_summarization.rst
	modified:   docs/source/benchmarks/text_summarization.rst

0 of 11303 relevant lines covered (0.0%)

0.0 hits per line

Source File
Press 'n' to go to next uncovered line, 'b' for previous

0.0
/evadb/executor/groupby_executor.py
1
# coding=utf-8
2
# Copyright 2018-2023 EvaDB
3
#
4
# Licensed under the Apache License, Version 2.0 (the "License");
5
# you may not use this file except in compliance with the License.
6
# You may obtain a copy of the License at
7
#
8
#     http://www.apache.org/licenses/LICENSE-2.0
9
#
10
# Unless required by applicable law or agreed to in writing, software
11
# distributed under the License is distributed on an "AS IS" BASIS,
12
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
# See the License for the specific language governing permissions and
14
# limitations under the License.
15
import re
×
16
from typing import Iterator
×
17

18
import pandas as pd
×
19

20
from evadb.database import EvaDBDatabase
×
21
from evadb.executor.abstract_executor import AbstractExecutor
×
22
from evadb.models.storage.batch import Batch
×
23
from evadb.plan_nodes.groupby_plan import GroupByPlan
×
24

25

26
class GroupByExecutor(AbstractExecutor):
    """
    Group inputs into 4d segments of the length provided in the query
    E.g., "GROUP BY '8 frames'" groups every 8 frames into one segment

    The segment length is obtained by stripping every non-digit character
    from the GROUP BY clause value and parsing what is left as an integer.

    Arguments:
        db (EvaDBDatabase): database handle passed on to AbstractExecutor
        node (GroupByPlan): The GroupBy Plan

    Raises:
        ValueError: if the GROUP BY clause value contains no digits, or if
            the resulting segment length is zero

    """

    def __init__(self, db: EvaDBDatabase, node: GroupByPlan):
        super().__init__(db, node)
        clause_value = node.groupby_clause.value
        # Drop everything that is not a digit, e.g. "8 frames" -> "8".
        numbers_only = re.sub(r"\D", "", clause_value)
        if not numbers_only:
            # int("") would raise an unhelpful "invalid literal" error;
            # report the offending clause instead.
            raise ValueError(
                f"GROUP BY clause {clause_value!r} does not contain a "
                "segment length"
            )
        segment_length = int(numbers_only)
        if segment_length < 1:
            # A zero length would make the slicing loop in exec() spin
            # forever, because len(batch) >= 0 is always true.
            raise ValueError(
                f"GROUP BY segment length must be positive, got "
                f"{segment_length} from clause {clause_value!r}"
            )
        self._segment_length = segment_length

    def exec(self, *args, **kwargs) -> Iterator[Batch]:
        """
        Yield consecutive batches of exactly ``_segment_length`` entries.

        Batches produced by the first child executor are appended to a
        carry-over buffer; full segments are sliced off the front and
        yielded, and the remainder is kept for the next child batch.

        Only the keyword arguments are forwarded to the child executor.
        """
        child_executor = self.children[0]

        buffer = Batch(pd.DataFrame())
        for batch in child_executor.exec(**kwargs):
            new_batch = buffer + batch
            # We assume that all the segments are exactly of segment_length
            # size and discard any dangling frames in the end: whatever is
            # left in the buffer once the child is exhausted is never
            # yielded.
            while len(new_batch) >= self._segment_length:
                yield new_batch[: self._segment_length]
                new_batch = new_batch[self._segment_length :]
            buffer = new_batch
×
STATUS · Troubleshooting · Open an Issue · Sales · Support · CAREERS · ENTERPRISE · START FREE · SCHEDULE DEMO
ANNOUNCEMENTS · TWITTER · TOS & SLA · Supported CI Services · What's a CI service? · Automated Testing

© 2025 Coveralls, Inc