All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.pulsar.functions.windowing.WindowManager Maven / Gradle / Ivy

There is a newer version: 4.0.0.4
Show newest version
/**
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *   http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
package org.apache.pulsar.functions.windowing;

import static org.apache.pulsar.functions.windowing.EvictionPolicy.Action.EXPIRE;
import static org.apache.pulsar.functions.windowing.EvictionPolicy.Action.PROCESS;
import static org.apache.pulsar.functions.windowing.EvictionPolicy.Action.STOP;

import java.util.ArrayList;
import java.util.Collection;
import java.util.HashSet;
import java.util.Iterator;
import java.util.List;
import java.util.Set;
import java.util.concurrent.atomic.AtomicInteger;
import java.util.concurrent.locks.ReentrantLock;

import lombok.extern.slf4j.Slf4j;

import org.apache.pulsar.functions.api.Record;

/**
 * Tracks a window of events and fires {@link WindowLifecycleListener} callbacks
 * on expiry of events or activation of the window due to {@link TriggerPolicy}.
 *
 * @param  the type of event in the window.
 */
@Slf4j
public class WindowManager implements TriggerHandler {

    /**
     * Expire old events every EXPIRE_EVENTS_THRESHOLD to
     * keep the window size in check.
     * 

* Note that if the eviction policy is based on watermarks, events will not be evicted until a new * watermark would cause them to be considered expired anyway, regardless of this limit */ protected static final int EXPIRE_EVENTS_THRESHOLD = 100; protected final Collection> queue; protected EvictionPolicy evictionPolicy; protected TriggerPolicy triggerPolicy; protected final WindowLifecycleListener> windowLifecycleListener; private final List> expiredEvents; private final Set> prevWindowEvents; private final AtomicInteger eventsSinceLastExpiry; private final ReentrantLock lock; /** * Constructs a {@link WindowManager} * * @param lifecycleListener the {@link WindowLifecycleListener} * @param queue a collection where the events in the window can be enqueued. *
* Note: This collection has to be thread safe. */ public WindowManager(WindowLifecycleListener> lifecycleListener, Collection> queue) { windowLifecycleListener = lifecycleListener; this.queue = queue; expiredEvents = new ArrayList<>(); prevWindowEvents = new HashSet<>(); eventsSinceLastExpiry = new AtomicInteger(); lock = new ReentrantLock(true); } public void setEvictionPolicy(EvictionPolicy evictionPolicy) { this.evictionPolicy = evictionPolicy; } public void setTriggerPolicy(TriggerPolicy triggerPolicy) { this.triggerPolicy = triggerPolicy; } /** * Add an event into the window, with the given ts as the tracking ts. * * @param event the event to track * @param ts the timestamp */ public void add(T event, long ts, Record record) { add(new EventImpl<>(event, ts, record)); } /** * Tracks a window event * * @param windowEvent the window event to track */ public void add(Event windowEvent) { // watermark events are not added to the queue. if (windowEvent.isWatermark()) { if (log.isDebugEnabled()) { log.debug("Got watermark event with ts {}", windowEvent.getTimestamp()); } } else { queue.add(windowEvent); } track(windowEvent); compactWindow(); } /** * The callback invoked by the trigger policy. */ @Override public boolean onTrigger() { List> windowEvents = null; List> expired = null; lock.lock(); try { /* * scan the entire window to handle out of order events in * the case of time based windows. */ windowEvents = scanEvents(true); expired = new ArrayList<>(expiredEvents); expiredEvents.clear(); } finally { lock.unlock(); } List> events = new ArrayList<>(); List> newEvents = new ArrayList<>(); for (Event event : windowEvents) { events.add(event); if (!prevWindowEvents.contains(event)) { newEvents.add(event); } } prevWindowEvents.clear(); if (!events.isEmpty()) { prevWindowEvents.addAll(windowEvents); if (log.isDebugEnabled()) { log.debug("invoking windowLifecycleListener onActivation, [{}] events in window.", events.size()); } windowLifecycleListener.onActivation(events, newEvents, expired, evictionPolicy.getContext().getReferenceTime()); } else { log.debug("No events in the window, skipping onActivation"); } triggerPolicy.reset(); return !events.isEmpty(); } public void shutdown() { log.debug("Shutting down WindowManager"); if (triggerPolicy != null) { triggerPolicy.shutdown(); } } /** * expires events that fall out of the window every * EXPIRE_EVENTS_THRESHOLD so that the window does not grow * too big. */ protected void compactWindow() { if (eventsSinceLastExpiry.incrementAndGet() >= EXPIRE_EVENTS_THRESHOLD) { scanEvents(false); } } /** * feed the event to the eviction and trigger policies * for bookkeeping and optionally firing the trigger. */ private void track(Event windowEvent) { evictionPolicy.track(windowEvent); triggerPolicy.track(windowEvent); } /** * Scan events in the queue, using the expiration policy to check * if the event should be evicted or not. * * @param fullScan if set, will scan the entire queue; if not set, will stop * as soon as an event not satisfying the expiration policy is found * @return the list of events to be processed as a part of the current window */ private List> scanEvents(boolean fullScan) { log.debug("Scan events, eviction policy {}", evictionPolicy); List> eventsToExpire = new ArrayList<>(); List> eventsToProcess = new ArrayList<>(); lock.lock(); try { Iterator> it = queue.iterator(); while (it.hasNext()) { Event windowEvent = it.next(); EvictionPolicy.Action action = evictionPolicy.evict(windowEvent); if (action == EXPIRE) { eventsToExpire.add(windowEvent); it.remove(); } else if (!fullScan || action == STOP) { break; } else if (action == PROCESS) { eventsToProcess.add(windowEvent); } } expiredEvents.addAll(eventsToExpire); } finally { lock.unlock(); } eventsSinceLastExpiry.set(0); if (log.isDebugEnabled()) { log.debug("[{}] events expired from window.", eventsToExpire.size()); } if (!eventsToExpire.isEmpty()) { log.debug("invoking windowLifecycleListener.onExpiry"); windowLifecycleListener.onExpiry(eventsToExpire); } return eventsToProcess; } /** * Scans the event queue and returns the next earliest event ts * between the startTs and endTs. * * @param startTs the start ts (exclusive) * @param endTs the end ts (inclusive) * @return the earliest event ts between startTs and endTs */ public long getEarliestEventTs(long startTs, long endTs) { long minTs = Long.MAX_VALUE; for (Event event : queue) { if (event.getTimestamp() > startTs && event.getTimestamp() <= endTs) { minTs = Math.min(minTs, event.getTimestamp()); } } return minTs; } /** * Scans the event queue and returns number of events having * timestamp less than or equal to the reference time. * * @param referenceTime the reference timestamp in millis * @return the count of events with timestamp less than or equal to referenceTime */ public int getEventCount(long referenceTime) { int count = 0; for (Event event : queue) { if (event.getTimestamp() <= referenceTime) { ++count; } } return count; } /** * Scans the event queue and returns the list of event ts * falling between startTs (exclusive) and endTs (inclusive) * at each sliding interval counts. * * @param startTs the start timestamp (exclusive) * @param endTs the end timestamp (inclusive) * @param slidingCount the sliding interval count * @return the list of event ts */ public List getSlidingCountTimestamps(long startTs, long endTs, int slidingCount) { List timestamps = new ArrayList<>(); if (endTs > startTs) { int count = 0; long ts = Long.MIN_VALUE; for (Event event : queue) { if (event.getTimestamp() > startTs && event.getTimestamp() <= endTs) { ts = Math.max(ts, event.getTimestamp()); if (++count % slidingCount == 0) { timestamps.add(ts); } } } } return timestamps; } @Override public String toString() { return "WindowManager{" + "evictionPolicy=" + evictionPolicy + ", triggerPolicy=" + triggerPolicy + '}'; } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy