blob: 458d5290758051194aa797322e52e3328894154e [file] [log] [blame]
/**
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
#pragma once
#include <array>
#include <cstdint>
#include <memory>
#include <optional>
#include <sstream>
#include <string>
#include <unordered_map>
#include <utility>
#include <vector>

#include "S3Processor.h"
#include "aws/kinesis/KinesisClient.h"
#include "aws/kinesis/model/PutRecordsRequest.h"
#include "core/PropertyDefinitionBuilder.h"
#include "utils/ArrayUtils.h"
#include "utils/expected.h"
namespace org::apache::nifi::minifi::aws::processors {
class PutKinesisStream : public AwsProcessor { // NOLINT(cppcoreguidelines-special-member-functions)
public:
EXTENSIONAPI static constexpr const char* Description = "Sends the contents to a specified Amazon Kinesis. In order to send data to Kinesis, the stream name has to be specified.";
EXTENSIONAPI static constexpr auto AmazonKinesisStreamName = core::PropertyDefinitionBuilder<>::createProperty("Amazon Kinesis Stream Name")
.withDescription("The name of Kinesis Stream")
.isRequired(true)
.withValidator(core::StandardPropertyValidators::NON_BLANK_VALIDATOR)
.supportsExpressionLanguage(true)
.build();
EXTENSIONAPI static constexpr auto AmazonKinesisStreamPartitionKey = core::PropertyDefinitionBuilder<>::createProperty("Amazon Kinesis Stream Partition Key")
.withDescription("The partition key attribute. If it is not set, a random value is used")
.supportsExpressionLanguage(true)
.build();
EXTENSIONAPI static constexpr auto MessageBatchSize = core::PropertyDefinitionBuilder<>::createProperty("Batch Size")
.withDescription("Batch size for messages. [1-500]")
.withValidator(core::StandardPropertyValidators::UNSIGNED_INTEGER_VALIDATOR)
.withDefaultValue("250")
.build();
EXTENSIONAPI static constexpr auto MaxBatchDataSize = core::PropertyDefinitionBuilder<>::createProperty("Max Batch Data Size")
.withDescription("Soft cap on the data size of the batch to a single stream. (max 4MB)")
.withValidator(core::StandardPropertyValidators::DATA_SIZE_VALIDATOR)
.withDefaultValue("1 MB")
.build();
EXTENSIONAPI static constexpr auto Properties = minifi::utils::array_cat(AwsProcessor::Properties, std::to_array<core::PropertyReference>({
AmazonKinesisStreamName, AmazonKinesisStreamPartitionKey, MessageBatchSize, MaxBatchDataSize
}));
EXTENSIONAPI static constexpr auto Success = core::RelationshipDefinition{"success", "FlowFiles are routed to success relationship"};
EXTENSIONAPI static constexpr auto Failure = core::RelationshipDefinition{"failure", "FlowFiles are routed to failure relationship"};
EXTENSIONAPI static constexpr auto Relationships = std::array{Success, Failure};
EXTENSIONAPI static constexpr auto AwsKinesisErrorMessage = core::OutputAttributeDefinition<>{"aws.kinesis.error.message", { Failure },
"Error message on posting message to AWS Kinesis"};
EXTENSIONAPI static constexpr auto AwsKinesisErrorCode = core::OutputAttributeDefinition<>{"aws.kinesis.error.code", { Failure },
"Error code for the message when posting to AWS Kinesis"};
EXTENSIONAPI static constexpr auto AwsKinesisSequenceNumber = core::OutputAttributeDefinition<>{"aws.kinesis.sequence.number", { Success },
"Sequence number for the message when posting to AWS Kinesis"};
EXTENSIONAPI static constexpr auto AwsKinesisShardId = core::OutputAttributeDefinition<>{"aws.kinesis.shard.id", { Success },
"Shard id of the message posted to AWS Kinesis"};
EXTENSIONAPI static constexpr auto OutputAttributes = std::to_array<core::OutputAttributeReference>({
AwsKinesisErrorMessage,
AwsKinesisErrorCode,
AwsKinesisSequenceNumber,
AwsKinesisShardId});
EXTENSIONAPI static constexpr bool SupportsDynamicProperties = false;
EXTENSIONAPI static constexpr bool SupportsDynamicRelationships = false;
EXTENSIONAPI static constexpr auto InputRequirement = core::annotation::Input::INPUT_REQUIRED;
EXTENSIONAPI static constexpr bool IsSingleThreaded = false;
ADD_COMMON_VIRTUAL_FUNCTIONS_FOR_PROCESSORS
using AwsProcessor::AwsProcessor;
~PutKinesisStream() override = default;
void initialize() override;
void onSchedule(core::ProcessContext& context, core::ProcessSessionFactory& session_factory) override;
void onTrigger(core::ProcessContext& context, core::ProcessSession& session) override;
protected:
virtual std::unique_ptr<Aws::Kinesis::KinesisClient> getClient(const Aws::Auth::AWSCredentials& credentials);
private:
struct BatchItemResult {
std::string sequence_number;
std::string shard_id;
};
struct BatchItemError {
std::string error_message;
std::optional<std::string> error_code;
};
struct BatchItem {
std::shared_ptr<core::FlowFile> flow_file;
nonstd::expected<BatchItemResult, BatchItemError> result;
};
struct StreamBatch {
uint64_t batch_size = 0;
std::vector<BatchItem> items;
Aws::Kinesis::Model::PutRecordsRequest request;
};
nonstd::expected<Aws::Kinesis::Model::PutRecordsRequestEntry, BatchItemError> createEntryFromFlowFile(const core::ProcessContext& context,
core::ProcessSession& session,
const std::shared_ptr<core::FlowFile>& flow_file) const;
std::unordered_map<std::string, StreamBatch> createStreamBatches(const core::ProcessContext& context, core::ProcessSession& session) const;
void processBatch(StreamBatch& stream_batch, const Aws::Kinesis::KinesisClient& client) const;
static void transferFlowFiles(core::ProcessSession& session, const StreamBatch& stream_batch);
uint64_t batch_size_ = 250;
uint64_t batch_data_size_soft_cap_ = 1_MB;
const utils::AWSInitializer& AWS_INITIALIZER = utils::AWSInitializer::get();
std::optional<std::string> endpoint_override_url_;
};
} // namespace org::apache::nifi::minifi::aws::processors