org.apache.pulsar.client.api.ProducerBuilder Maven / Gradle / Ivy
/**
* Licensed to the Apache Software Foundation (ASF) under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. The ASF licenses this file
* to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.apache.pulsar.client.api;
import java.util.Map;
import java.util.concurrent.CompletableFuture;
import java.util.concurrent.TimeUnit;
import org.apache.pulsar.client.api.PulsarClientException.ProducerQueueIsFullError;
import org.apache.pulsar.common.classification.InterfaceAudience;
import org.apache.pulsar.common.classification.InterfaceStability;
/**
* {@link ProducerBuilder} is used to configure and create instances of {@link Producer}.
*
* @see PulsarClient#newProducer()
* @see PulsarClient#newProducer(Schema)
*/
@InterfaceAudience.Public
@InterfaceStability.Stable
public interface ProducerBuilder extends Cloneable {
/**
* Finalize the creation of the {@link Producer} instance.
*
* This method will block until the producer is created successfully.
*
* @return the producer instance
* @throws PulsarClientException.ProducerBusyException
* if a producer with the same "producer name" is already connected to the topic
* @throws PulsarClientException
* if the producer creation fails
*/
Producer create() throws PulsarClientException;
/**
* Finalize the creation of the {@link Producer} instance in asynchronous mode.
*
* This method will return a {@link CompletableFuture} that can be used to access the instance when it's ready.
*
* @return a future that will yield the created producer instance
* @throws PulsarClientException.ProducerBusyException
* if a producer with the same "producer name" is already connected to the topic
* @throws PulsarClientException
* if the producer creation fails
*/
CompletableFuture> createAsync();
/**
* Load the configuration from provided config map.
*
* Example:
*
{@code
* Map config = new HashMap<>();
* config.put("producerName", "test-producer");
* config.put("sendTimeoutMs", 2000);
*
* ProducerBuilder builder = client.newProducer()
* .loadConf(config);
*
* Producer producer = builder.create();
* }
*
* @param config configuration map to load
* @return the producer builder instance
*/
ProducerBuilder loadConf(Map config);
/**
* Create a copy of the current {@link ProducerBuilder}.
*
* Cloning the builder can be used to share an incomplete configuration and specialize it multiple times. For
* example:
*
{@code
* ProducerBuilder builder = client.newProducer(Schema.STRING)
* .sendTimeout(10, TimeUnit.SECONDS)
* .blockIfQueueFull(true);
*
* Producer producer1 = builder.clone().topic("topic-1").create();
* Producer producer2 = builder.clone().topic("topic-2").create();
* }
*
* @return a clone of the producer builder instance
*/
ProducerBuilder clone();
/**
* Specify the topic this producer will be publishing on.
*
* This argument is required when constructing the produce.
*
* @param topicName the name of the topic
* @return the producer builder instance
*/
ProducerBuilder topic(String topicName);
/**
* Specify a name for the producer.
*
* If not assigned, the system will generate a globally unique name which can be accessed with
* {@link Producer#getProducerName()}.
*
*
Warning: When specifying a name, it is up to the user to ensure that, for a given topic,
* the producer name is unique across all Pulsar's clusters.
* Brokers will enforce that only a single producer a given name can be publishing on a topic.
*
* @param producerName
* the custom name to use for the producer
* @return the producer builder instance
*/
ProducerBuilder producerName(String producerName);
/**
* Set the send timeout (default: 30 seconds).
*
* If a message is not acknowledged by the server before the sendTimeout expires, an error will be reported.
*
*
Setting the timeout to zero, for example {@code setTimeout(0, TimeUnit.SECONDS)} will set the timeout
* to infinity, which can be useful when using Pulsar's message deduplication feature, since the client
* library will retry forever to publish a message. No errors will be propagated back to the application.
*
* @param sendTimeout
* the send timeout
* @param unit
* the time unit of the {@code sendTimeout}
* @return the producer builder instance
*/
ProducerBuilder sendTimeout(int sendTimeout, TimeUnit unit);
/**
* Set the max size of the queue holding the messages pending to receive an acknowledgment from the broker.
*
* When the queue is full, by default, all calls to {@link Producer#send} and {@link Producer#sendAsync}
* will fail unless {@code blockIfQueueFull=true}. Use {@link #blockIfQueueFull(boolean)}
* to change the blocking behavior.
*
*
The producer queue size also determines the max amount of memory that will be required by
* the client application. Until, the producer gets a successful acknowledgment back from the broker,
* it will keep in memory (direct memory pool) all the messages in the pending queue.
*
*
Default is 1000.
*
* @param maxPendingMessages
* the max size of the pending messages queue for the producer
* @return the producer builder instance
*/
ProducerBuilder maxPendingMessages(int maxPendingMessages);
/**
* Set the number of max pending messages across all the partitions.
*
* This setting will be used to lower the max pending messages for each partition
* ({@link #maxPendingMessages(int)}), if the total exceeds the configured value.
* The purpose of this setting is to have an upper-limit on the number
* of pending messages when publishing on a partitioned topic.
*
*
Default is 50000.
*
*
If publishing at high rate over a topic with many partitions (especially when publishing messages without a
* partitioning key), it might be beneficial to increase this parameter to allow for more pipelining within the
* individual partitions producers.
*
* @param maxPendingMessagesAcrossPartitions
* max pending messages across all the partitions
* @return the producer builder instance
*/
ProducerBuilder maxPendingMessagesAcrossPartitions(int maxPendingMessagesAcrossPartitions);
/**
* Set whether the {@link Producer#send} and {@link Producer#sendAsync} operations should block when the outgoing
* message queue is full.
*
* Default is {@code false}. If set to {@code false}, send operations will immediately fail with
* {@link ProducerQueueIsFullError} when there is no space left in pending queue. If set to
* {@code true}, the {@link Producer#sendAsync} operation will instead block.
*
*
Setting {@code blockIfQueueFull=true} simplifies the task of an application that
* just wants to publish messages as fast as possible, without having to worry
* about overflowing the producer send queue.
*
*
For example:
*
* Producer<String> producer = client.newProducer()
* .topic("my-topic")
* .blockIfQueueFull(true)
* .create();
*
* while (true) {
* producer.sendAsync("my-message")
* .thenAccept(messageId -> {
* System.out.println("Published message: " + messageId);
* })
* .exceptionally(ex -> {
* System.err.println("Failed to publish: " + e);
* return null;
* });
* }
*
*
* @param blockIfQueueFull
* whether to block {@link Producer#send} and {@link Producer#sendAsync} operations on queue full
* @return the producer builder instance
*/
ProducerBuilder blockIfQueueFull(boolean blockIfQueueFull);
/**
* Set the {@link MessageRoutingMode} for a partitioned producer.
*
* Default routing mode is to round-robin across the available partitions.
*
*
This logic is applied when the application is not setting a key on a
* particular message. If the key is set with {@link MessageBuilder#setKey(String)},
* then the hash of the key will be used to select a partition for the message.
*
* @param messageRoutingMode
* the message routing mode
* @return the producer builder instance
* @see MessageRoutingMode
*/
ProducerBuilder messageRoutingMode(MessageRoutingMode messageRoutingMode);
/**
* Change the {@link HashingScheme} used to chose the partition on where to publish a particular message.
*
* Standard hashing functions available are:
*
* - {@link HashingScheme#JavaStringHash}: Java {@code String.hashCode()} (Default)
*
- {@link HashingScheme#Murmur3_32Hash}: Use Murmur3 hashing function.
* https://en.wikipedia.org/wiki/MurmurHash
*
*
* @param hashingScheme
* the chosen {@link HashingScheme}
* @return the producer builder instance
*/
ProducerBuilder hashingScheme(HashingScheme hashingScheme);
/**
* Set the compression type for the producer.
*
* By default, message payloads are not compressed. Supported compression types are:
*
* - {@link CompressionType#NONE}: No compression (Default)
* - {@link CompressionType#LZ4}: Compress with LZ4 algorithm. Faster but lower compression than ZLib
* - {@link CompressionType#ZLIB}: Standard ZLib compression
* - {@link CompressionType#ZSTD} Compress with Zstandard codec. Since Pulsar 2.3. Zstd cannot be used if consumer
* applications are not in version >= 2.3 as well
* - {@link CompressionType#SNAPPY} Compress with Snappy codec. Since Pulsar 2.4. Snappy cannot be used if
* consumer applications are not in version >= 2.4 as well
*
*
* @param compressionType
* the selected compression type
* @return the producer builder instance
*/
ProducerBuilder compressionType(CompressionType compressionType);
/**
* Set a custom message routing policy by passing an implementation of MessageRouter.
*
* @param messageRouter
* @return the producer builder instance
*/
ProducerBuilder messageRouter(MessageRouter messageRouter);
/**
* Control whether automatic batching of messages is enabled for the producer. default: enabled
*
* When batching is enabled, multiple calls to {@link Producer#sendAsync} can result in a single batch
* to be sent to the broker, leading to better throughput, especially when publishing small messages.
* If compression is enabled, messages will be compressed at the batch level, leading to a much better
* compression ratio for similar headers or contents.
*
*
When enabled default batch delay is set to 1 ms and default batch size is 1000 messages
*
*
Batching is enabled by default since 2.0.0.
*
* @see #batchingMaxPublishDelay(long, TimeUnit)
* @see #batchingMaxMessages(int)
* @return the producer builder instance
*/
ProducerBuilder enableBatching(boolean enableBatching);
/**
* If message size is higher than allowed max publish-payload size by broker then enableChunking helps producer to
* split message into multiple chunks and publish them to broker separately and in order. So, it allows client to
* successfully publish large size of messages in pulsar.
*
* This feature allows publisher to publish large size of message by splitting it to multiple chunks and let
* consumer stitch them together to form a original large published message. Therefore, it's necessary to configure
* recommended configuration at pulsar producer and consumer. Recommendation to use this feature:
*
*
* 1. This feature is right now only supported by non-shared subscription and persistent-topic.
* 2. Disable batching to use chunking feature
* 3. Pulsar-client keeps published messages into buffer until it receives ack from broker.
* So, it's better to reduce "maxPendingMessages" size to avoid producer occupying large amount
* of memory by buffered messages.
* 4. Set message-ttl on the namespace to cleanup incomplete chunked messages.
* (sometime due to broker-restart or publish time, producer might fail to publish entire large message
* so, consumer will not be able to consume and ack those messages. So, those messages can
* be only discared by msg ttl) Or configure
* {@link ConsumerBuilder#expireTimeOfIncompleteChunkedMessage()}
* 5. Consumer configuration: consumer should also configure receiverQueueSize and maxPendingChuckedMessage
*
* @param enableChunking
* @return
*/
ProducerBuilder enableChunking(boolean enableChunking);
/**
* Sets a {@link CryptoKeyReader}.
*
* Configure the key reader to be used to encrypt the message payloads.
*
* @param cryptoKeyReader
* CryptoKeyReader object
* @return the producer builder instance
*/
ProducerBuilder cryptoKeyReader(CryptoKeyReader cryptoKeyReader);
/**
* Add public encryption key, used by producer to encrypt the data key.
*
* At the time of producer creation, Pulsar client checks if there are keys added to encryptionKeys. If keys are
* found, a callback {@link CryptoKeyReader#getPrivateKey(String, Map)} and
* {@link CryptoKeyReader#getPublicKey(String, Map)} is invoked against each key to load the values of the key.
* Application should implement this callback to return the key in pkcs8 format. If compression is enabled, message
* is encrypted after compression. If batch messaging is enabled, the batched message is encrypted.
*
* @param key
* the name of the encryption key in the key store
* @return the producer builder instance
*/
ProducerBuilder addEncryptionKey(String key);
/**
* Sets the ProducerCryptoFailureAction to the value specified.
*
* @param action
* the action the producer will take in case of encryption failures
* @return the producer builder instance
*/
ProducerBuilder cryptoFailureAction(ProducerCryptoFailureAction action);
/**
* Set the time period within which the messages sent will be batched default: 1 ms if batch messages are
* enabled. If set to a non zero value, messages will be queued until either:
*
* - this time interval expires
* - the max number of messages in a batch is reached ({@link #batchingMaxMessages(int)})
*
- the max size of batch is reached
*
*
* All messages will be published as a single batch message. The consumer will be delivered individual
* messages in the batch in the same order they were enqueued.
*
* @param batchDelay
* the batch delay
* @param timeUnit
* the time unit of the {@code batchDelay}
* @return the producer builder instance
* @see #batchingMaxMessages(int)
* @see #batchingMaxBytes(int)
*/
ProducerBuilder batchingMaxPublishDelay(long batchDelay, TimeUnit timeUnit);
/**
* Set the partition switch frequency while batching of messages is enabled and
* using round-robin routing mode for non-keyed message default: 10.
*
* The time period of partition switch is frequency * batchingMaxPublishDelay. During this period,
* all messages arrives will be route to the same partition.
*
* @param frequency the frequency of partition switch
* @return the producer builder instance
* @see #messageRoutingMode(MessageRoutingMode)
* @see #batchingMaxPublishDelay(long, TimeUnit)
*/
ProducerBuilder roundRobinRouterBatchingPartitionSwitchFrequency(int frequency);
/**
* Set the maximum number of messages permitted in a batch. default: 1000 If set to a value greater than 1,
* messages will be queued until this threshold is reached or batch interval has elapsed.
*
* All messages in batch will be published as a single batch message. The consumer will be delivered individual
* messages in the batch in the same order they were enqueued.
*
* @param batchMessagesMaxMessagesPerBatch
* maximum number of messages in a batch
* @return the producer builder instance
* @see #batchingMaxPublishDelay(long, TimeUnit)
* @see #batchingMaxBytes(int)
*/
ProducerBuilder batchingMaxMessages(int batchMessagesMaxMessagesPerBatch);
/**
* Set the maximum number of bytes permitted in a batch. default: 128KB
* If set to a value greater than 0, messages will be queued until this threshold is reached
* or other batching conditions are met.
*
* All messages in a batch will be published as a single batched message. The consumer will be delivered
* individual messages in the batch in the same order they were enqueued.
*
* @param batchingMaxBytes maximum number of bytes in a batch
* @return the producer builder instance
* @see #batchingMaxPublishDelay(long, TimeUnit)
* @see #batchingMaxMessages(int)
*/
ProducerBuilder batchingMaxBytes(int batchingMaxBytes);
/**
* Set the batcher builder {@link BatcherBuilder} of the producer. Producer will use the batcher builder to
* build a batch message container.This is only be used when batching is enabled.
*
* @param batcherBuilder
* batcher builder
* @return the producer builder instance
*/
ProducerBuilder batcherBuilder(BatcherBuilder batcherBuilder);
/**
* Set the baseline for the sequence ids for messages published by the producer.
*
* First message will be using {@code (initialSequenceId + 1)} as its sequence id and
* subsequent messages will be assigned incremental sequence ids, if not otherwise specified.
*
* @param initialSequenceId the initial sequence id for the producer
* @return the producer builder instance
*/
ProducerBuilder initialSequenceId(long initialSequenceId);
/**
* Set a name/value property with this producer.
*
* Properties are application defined metadata that can be attached to the producer.
* When getting the topic stats, this metadata will be associated to the producer
* stats for easier identification.
*
* @param key
* the property key
* @param value
* the property value
* @return the producer builder instance
*/
ProducerBuilder property(String key, String value);
/**
* Add all the properties in the provided map to the producer.
*
* Properties are application defined metadata that can be attached to the producer.
* When getting the topic stats, this metadata will be associated to the producer
* stats for easier identification.
*
* @param properties the map of properties
* @return the producer builder instance
*/
ProducerBuilder properties(Map properties);
/**
* Add a set of {@link ProducerInterceptor} to the producer.
*
* Interceptors can be used to trace the publish and acknowledgments operation happening in a producer.
*
* @param interceptors
* the list of interceptors to intercept the producer created by this builder.
* @return the producer builder instance
*/
@Deprecated
ProducerBuilder intercept(ProducerInterceptor ... interceptors);
/**
* Add a set of {@link org.apache.pulsar.client.api.interceptor.ProducerInterceptor} to the producer.
*
* Interceptors can be used to trace the publish and acknowledgments operation happening in a producer.
*
* @param interceptors
* the list of interceptors to intercept the producer created by this builder.
* @return the producer builder instance
*/
ProducerBuilder intercept(org.apache.pulsar.client.api.interceptor.ProducerInterceptor... interceptors);
/**
* If enabled, partitioned producer will automatically discover new partitions at runtime. This is only applied on
* partitioned topics.
*
* Default is true.
*
* @param autoUpdate
* whether to auto discover the partition configuration changes
* @return the producer builder instance
*/
ProducerBuilder autoUpdatePartitions(boolean autoUpdate);
/**
* Set the interval of updating partitions (default: 1 minute). This only works if autoUpdatePartitions is
* enabled.
*
* @param interval
* the interval of updating partitions
* @param unit
* the time unit of the interval.
* @return the producer builder instance
*/
ProducerBuilder autoUpdatePartitionsInterval(int interval, TimeUnit unit);
/**
* Control whether enable the multiple schema mode for producer.
* If enabled, producer can send a message with different schema from that specified just when it is created,
* otherwise a invalid message exception would be threw
* if the producer want to send a message with different schema.
*
* Enabled by default.
*
* @param multiSchema
* indicates to enable or disable multiple schema mode
* @return the producer builder instance
* @since 2.5.0
*/
ProducerBuilder enableMultiSchema(boolean multiSchema);
}