"""
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
* <p>
* http://www.apache.org/licenses/LICENSE-2.0
* <p>
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
"""
from __future__ import absolute_import

import logging
import threading

from kafka.consumer.fetcher import ConsumerRecord
import kafka.errors as Errors
from kafka.structs import OffsetAndMetadata

from .context import ProcessorContext
from .partition_group import PartitionGroup, RecordInfo
from .punctuation import PunctuationQueue
from .record_collector import RecordCollector
from .record_queue import RecordQueue
from .task import AbstractTask

NONEXIST_TOPIC = '__null_topic__'
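# a placeholder record handed to processors while punctuating, when there is
# no real consumer record to expose through the processor context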
DUMMY_RECORD = ConsumerRecord(NONEXIST_TOPIC, -1, -1, -1, -1, None, None, -1, -1, -1)

log = logging.getLogger(__name__)


class StreamTask(AbstractTask):
"""A StreamTask is associated with a PartitionGroup,
and is assigned to a StreamThread for processing."""

    def __init__(self, task_id, partitions, topology, consumer, producer, restore_consumer, **config):
        """Create a StreamTask with its assigned partitions

        Arguments:
task_id (str): the ID of this task
partitions (list of TopicPartition): the assigned partitions
topology (ProcessorTopology): the instance of ProcessorTopology
consumer (Consumer): the instance of Consumer
producer (Producer): the instance of Producer
restore_consumer (Consumer): the instance of Consumer used when
restoring state
"""
super(StreamTask, self).__init__(task_id, partitions, topology,
consumer, restore_consumer, False, **config)
self._punctuation_queue = PunctuationQueue()
self._record_info = RecordInfo()
self.max_buffered_size = config['buffered_records_per_partition']
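        # serializes calls to process() so only one record is handled at a time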
self._process_lock = threading.Lock()
self._commit_requested = False
self._commit_offset_needed = False
self._curr_record = None
self._curr_node = None
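        # requires_poll tells the owning StreamThread whether it should poll
        # the consumer for more records before processing again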
self.requires_poll = True
# create queues for each assigned partition and associate them
# to corresponding source nodes in the processor topology
partition_queues = {}
for partition in partitions:
            source = self.topology.source(partition.topic)
            queue = self._create_record_queue(partition, source)
partition_queues[partition] = queue
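        # the partition group unifies the per-partition queues and picks the
        # next record to process according to the configured timestamp extractor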
self.partition_group = PartitionGroup(partition_queues, self.config['timestamp_extractor'])
# initialize the consumed offset cache
self.consumed_offsets = {}
        # create the record collector that maintains the produced offsets
self.record_collector = RecordCollector(self.producer)
        log.info('Initializing processor context for stream task %s', self.id)
# initialize the topology with its own context
self.processor_context = ProcessorContext(self.id, self, self.record_collector, self.state_mgr, **config)
# initialize the state stores
self.initialize_state_stores()
# initialize the task by initializing all its processor nodes in the topology
for node in self.topology.processors():
self._curr_node = node
try:
node.init(self.processor_context)
finally:
self._curr_node = None
self.processor_context.initialized()

    def add_records(self, partition, records):
        """Add raw records to the partition's queue"""
queue_size = self.partition_group.add_raw_records(partition, records)
# if after adding these records, its partition queue's buffered size has
# been increased beyond the threshold, we can then pause the consumption
# for this partition
if queue_size > self.max_buffered_size:
self.consumer.pause(partition)

    def process(self):
        """Process one record

        Returns:
            the number of records left in the buffer of this task's
            partition group after processing is done
        """
with self._process_lock:
# get the next record to process
timestamp, record = self.partition_group.next_record(self._record_info)
# if there is no record to process, return immediately
if record is None:
self.requires_poll = True
return 0
self.requires_poll = False
try:
# process the record by passing to the source node of the topology
self._curr_record = record
self._curr_node = self._record_info.node()
partition = self._record_info.partition()
log.debug('Start processing one record [%s]', self._curr_record)
self._curr_node.process(self._curr_record.key, self._curr_record.value)
log.debug('Completed processing one record [%s]', self._curr_record)
# update the consumed offset map after processing is done
self.consumed_offsets[partition] = self._curr_record.offset
self._commit_offset_needed = True
# after processing this record, if its partition queue's
# buffered size has been decreased to the threshold, we can then
# resume the consumption on this partition
if self._record_info.queue().size() == self.max_buffered_size:
self.consumer.resume(partition)
self.requires_poll = True
if self.partition_group.top_queue_size() <= self.max_buffered_size:
self.requires_poll = True
finally:
self._curr_record = None
self._curr_node = None
return self.partition_group.num_buffered()

    def maybe_punctuate(self):
        """Trigger registered punctuation functions if the current
        partition group timestamp has reached the scheduled timestamp
        """
timestamp = self.partition_group.timestamp()
        # if the timestamp is not known yet, meaning there is not enough data
        # accumulated to reason about the stream partition time, then skip
if timestamp == -1:
return False
else:
return self._punctuation_queue.may_punctuate(timestamp, self)

    def punctuate(self, node, timestamp):
        """Invoke the punctuation function of the given node at the given timestamp"""
if self._curr_node is not None:
raise Errors.IllegalStateError('Current node is not null')
self._curr_node = node
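        # stand in a dummy record stamped with the punctuation timestamp, since
        # there is no real consumer record while punctuating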
self._curr_record = (timestamp, DUMMY_RECORD)
try:
node.processor().punctuate(timestamp)
finally:
self._curr_node = None
self._curr_record = None

    def record(self):
        """Return the record currently being processed, if any"""
        return self._curr_record

    def node(self):
        """Return the node that is currently processing, if any"""
        return self._curr_node

    def commit(self):
"""Commit the current task state"""
# 1) flush local state
self.state_mgr.flush()
# 2) flush produced records in the downstream and change logs of local states
self.record_collector.flush()
# 3) commit consumed offsets if it is dirty already
if self._commit_offset_needed:
consumed_offsets_and_metadata = {}
for partition, offset in self.consumed_offsets.items():
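                # commit offset + 1: the committed offset is the position of
                # the next record to consume, not of the last record processed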
                consumed_offsets_and_metadata[partition] = OffsetAndMetadata(offset + 1, '')
self.state_mgr.put_offset_limit(partition, offset + 1)
self.consumer.commit(consumed_offsets_and_metadata)
self._commit_offset_needed = False
self._commit_requested = False

    def commit_needed(self):
        """Whether a request has been made to commit the current state"""
        return self._commit_requested

    def need_commit(self):
        """Request a commit of the current task state"""
        self._commit_requested = True

    def schedule(self, interval_ms):
        """Schedule a punctuation for the processor

        Arguments:
            interval_ms (int): the interval in milliseconds

        Raises: IllegalStateError if the current node is None
        """
if self._curr_node is None:
raise Errors.IllegalStateError('Current node is null')
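        # a schedule entry is assumed to be a (start time, node, interval)
        # triple as consumed by PunctuationQueue, with 0 meaning immediately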
schedule = (0, self._curr_node, interval_ms)
self._punctuation_queue.schedule(schedule)

    def close(self):
        self.partition_group.close()
        self.consumed_offsets.clear()
        # close the processors; make sure close() is called for each node
        # even when one of them raises a RuntimeError
exception = None
for node in self.topology.processors():
self._curr_node = node
try:
node.close()
except RuntimeError as e:
exception = e
finally:
self._curr_node = None
super(StreamTask, self).close()
if exception is not None:
raise exception

    def record_collector_offsets(self):
        """Return the offsets of records produced through the record collector"""
        return self.record_collector.offsets()

    def _create_record_queue(self, partition, source):
        return RecordQueue(partition, source)

    def forward(self, key, value, child_index=None, child_name=None):
        """Forward a key-value pair to the children of the current node

        If child_index or child_name is given, forward only to the matching
        child; otherwise forward to every child.
        """
this_node = self._curr_node
try:
children = this_node.children()
if child_index is not None:
children = [children[child_index]]
elif child_name is not None:
children = [child for child in children if child.name == child_name]
for child_node in children:
self._curr_node = child_node
child_node.process(key, value)
finally:
self._curr_node = this_node
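

# A rough sketch of how a StreamThread is assumed to drive a StreamTask. The
# names `thread_consumer` and `task`, and the 100 ms poll timeout, are
# illustrative only, not part of this module:
#
#     records_by_partition = thread_consumer.poll(timeout_ms=100)
#     for partition, records in records_by_partition.items():
#         task.add_records(partition, records)
#     while task.process() > 0:       # drain buffered records one at a time
#         task.maybe_punctuate()      # fire any punctuations that came due
#         if task.commit_needed():    # honor explicit commit requests
#             task.commit()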