org.apache.nifi.util.FlowFilePackagerV2 Maven / Gradle / Ivy
/*
* Licensed to the Apache Software Foundation (ASF) under one or more
* contributor license agreements. See the NOTICE file distributed with
* this work for additional information regarding copyright ownership.
* The ASF licenses this file to You under the Apache License, Version 2.0
* (the "License"); you may not use this file except in compliance with
* the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package org.apache.nifi.util;
import java.io.IOException;
import java.io.InputStream;
import java.io.OutputStream;
import java.util.Map;
/**
*
* Packages a FlowFile, including both its content and its attributes into a
* single file that is stream-friendly. The encoding scheme is as such:
*
*
*
* Length Field : indicates the number of Flow File Attributes in the stream
* 1 to N times (N=number of Flow File Attributes):
* String Field : Flow File Attribute key name
* String Field : Flow File Attribute value
* Long : 8 bytes indicating the length of the Flow File content
* Content : The next M bytes are the content of the Flow File.
*
*
*
* Encoding of String Field is as follows:
* Length Field : indicates the length of the String
* 1 to N bytes (N=String length, determined by previous field, as described above) : The UTF-8 encoded string value.
*
*
*
* Encoding of Length Field is as follows:
* First 2 bytes: Indicate length. If both bytes = 255, this is a special value indicating that the length is
* greater than or equal to 65536 bytes; therefore, the next 4 bytes will indicate the actual length.
*
*
*
* Note: All byte-order encoding is Network Byte Order (Most Significant Byte
* first)
*
*
*
* The following example shows the bytes expected if we were to encode a
* FlowFile containing the following attributes where the content is the text
* "Hello World!":
*
*
* Attributes:
*
* +-------+-------+
* | Key + Value |
* + --------------+
* | A | a |
* + --------------+
* | B | b |
* + --------------+
*
Content:
* Hello World!
*
* Packaged Byte Encoding (In Hexadecimal Form):
*
*
*
* 00 02 00 01 41 00 01 61
* 00 01 42 00 01 62 00 00
* 00 00 00 00 00 0C 48 65
* 6C 6C 6F 20 57 6F 72 6C
* 64 21
*
*/
public class FlowFilePackagerV2 implements FlowFilePackager {
private static final int MAX_VALUE_2_BYTES = 65535;
private final byte[] writeBuffer = new byte[8];
@Override
public void packageFlowFile(final InputStream in, final OutputStream out, final Map attributes, final long fileSize) throws IOException {
writeFieldLength(out, attributes.size()); //write out the number of attributes
for (final Map.Entry entry : attributes.entrySet()) { //write out each attribute key/value pair
writeString(entry.getKey(), out);
writeString(entry.getValue(), out);
}
writeLong(out, fileSize); //write out length of data
copy(in, out); //write out the actual flow file payload
}
private void copy(final InputStream in, final OutputStream out) throws IOException {
final byte[] buffer = new byte[65536];
int len;
while ((len = in.read(buffer)) > 0) {
out.write(buffer, 0, len);
}
}
private void writeString(final String val, final OutputStream out) throws IOException {
final byte[] bytes = val.getBytes("UTF-8");
writeFieldLength(out, bytes.length);
out.write(bytes);
}
private void writeFieldLength(final OutputStream out, final int numBytes) throws IOException {
// If the value is less than the max value that can be fit into 2 bytes, just use the
// actual value. Otherwise, we will set the first 2 bytes to 255/255 and then use the next
// 4 bytes to indicate the real length.
if (numBytes < MAX_VALUE_2_BYTES) {
writeBuffer[0] = (byte) (numBytes >>> 8);
writeBuffer[1] = (byte) (numBytes);
out.write(writeBuffer, 0, 2);
} else {
writeBuffer[0] = (byte) 0xff;
writeBuffer[1] = (byte) 0xff;
writeBuffer[2] = (byte) (numBytes >>> 24);
writeBuffer[3] = (byte) (numBytes >>> 16);
writeBuffer[4] = (byte) (numBytes >>> 8);
writeBuffer[5] = (byte) (numBytes);
out.write(writeBuffer, 0, 6);
}
}
private void writeLong(final OutputStream out, final long val) throws IOException {
writeBuffer[0] = (byte) (val >>> 56);
writeBuffer[1] = (byte) (val >>> 48);
writeBuffer[2] = (byte) (val >>> 40);
writeBuffer[3] = (byte) (val >>> 32);
writeBuffer[4] = (byte) (val >>> 24);
writeBuffer[5] = (byte) (val >>> 16);
writeBuffer[6] = (byte) (val >>> 8);
writeBuffer[7] = (byte) (val);
out.write(writeBuffer, 0, 8);
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy