All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.apache.nifi.registry.util.FormatUtils Maven / Gradle / Ivy

/*
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
package org.apache.nifi.registry.util;

import java.text.NumberFormat;
import java.util.Arrays;
import java.util.List;
import java.util.concurrent.TimeUnit;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

public class FormatUtils {
    private static final String UNION = "|";

    // for Data Sizes
    private static final double BYTES_IN_KILOBYTE = 1024;
    private static final double BYTES_IN_MEGABYTE = BYTES_IN_KILOBYTE * 1024;
    private static final double BYTES_IN_GIGABYTE = BYTES_IN_MEGABYTE * 1024;
    private static final double BYTES_IN_TERABYTE = BYTES_IN_GIGABYTE * 1024;

    // for Time Durations
    private static final String NANOS = join(UNION, "ns", "nano", "nanos", "nanosecond", "nanoseconds");
    private static final String MILLIS = join(UNION, "ms", "milli", "millis", "millisecond", "milliseconds");
    private static final String SECS = join(UNION, "s", "sec", "secs", "second", "seconds");
    private static final String MINS = join(UNION, "m", "min", "mins", "minute", "minutes");
    private static final String HOURS = join(UNION, "h", "hr", "hrs", "hour", "hours");
    private static final String DAYS = join(UNION, "d", "day", "days");
    private static final String WEEKS = join(UNION, "w", "wk", "wks", "week", "weeks");

    private static final String VALID_TIME_UNITS = join(UNION, NANOS, MILLIS, SECS, MINS, HOURS, DAYS, WEEKS);
    public static final String TIME_DURATION_REGEX = "([\\d.]+)\\s*(" + VALID_TIME_UNITS + ")";
    public static final Pattern TIME_DURATION_PATTERN = Pattern.compile(TIME_DURATION_REGEX);
    private static final List TIME_UNIT_MULTIPLIERS = Arrays.asList(1000L, 1000L, 1000L, 60L, 60L, 24L);

    /**
     * Formats the specified count by adding commas.
     *
     * @param count the value to add commas to
     * @return the string representation of the given value with commas included
     */
    public static String formatCount(final long count) {
        return NumberFormat.getIntegerInstance().format(count);
    }

    /**
     * Formats the specified duration in 'mm:ss.SSS' format.
     *
     * @param sourceDuration the duration to format
     * @param sourceUnit     the unit to interpret the duration
     * @return representation of the given time data in minutes/seconds
     */
    public static String formatMinutesSeconds(final long sourceDuration, final TimeUnit sourceUnit) {
        final long millis = TimeUnit.MILLISECONDS.convert(sourceDuration, sourceUnit);

        final long millisInMinute = TimeUnit.MILLISECONDS.convert(1, TimeUnit.MINUTES);
        final int minutes = (int) (millis / millisInMinute);
        final long secondsMillisLeft = millis - minutes * millisInMinute;

        final long millisInSecond = TimeUnit.MILLISECONDS.convert(1, TimeUnit.SECONDS);
        final int seconds = (int) (secondsMillisLeft / millisInSecond);
        final long millisLeft = secondsMillisLeft - seconds * millisInSecond;

        return pad2Places(minutes) + ":" + pad2Places(seconds) + "." + pad3Places(millisLeft);
    }

    /**
     * Formats the specified duration in 'HH:mm:ss.SSS' format.
     *
     * @param sourceDuration the duration to format
     * @param sourceUnit     the unit to interpret the duration
     * @return representation of the given time data in hours/minutes/seconds
     */
    public static String formatHoursMinutesSeconds(final long sourceDuration, final TimeUnit sourceUnit) {
        final long millis = TimeUnit.MILLISECONDS.convert(sourceDuration, sourceUnit);

        final long millisInHour = TimeUnit.MILLISECONDS.convert(1, TimeUnit.HOURS);
        final int hours = (int) (millis / millisInHour);
        final long minutesSecondsMillisLeft = millis - hours * millisInHour;

        return pad2Places(hours) + ":" + formatMinutesSeconds(minutesSecondsMillisLeft, TimeUnit.MILLISECONDS);
    }

    private static String pad2Places(final long val) {
        return (val < 10) ? "0" + val : String.valueOf(val);
    }

    private static String pad3Places(final long val) {
        return (val < 100) ? "0" + pad2Places(val) : String.valueOf(val);
    }

    /**
     * Formats the specified data size in human readable format.
     *
     * @param dataSize Data size in bytes
     * @return Human readable format
     */
    public static String formatDataSize(final double dataSize) {
        // initialize the formatter
        final NumberFormat format = NumberFormat.getNumberInstance();
        format.setMaximumFractionDigits(2);

        // check terabytes
        double dataSizeToFormat = dataSize / BYTES_IN_TERABYTE;
        if (dataSizeToFormat > 1) {
            return format.format(dataSizeToFormat) + " TB";
        }

        // check gigabytes
        dataSizeToFormat = dataSize / BYTES_IN_GIGABYTE;
        if (dataSizeToFormat > 1) {
            return format.format(dataSizeToFormat) + " GB";
        }

        // check megabytes
        dataSizeToFormat = dataSize / BYTES_IN_MEGABYTE;
        if (dataSizeToFormat > 1) {
            return format.format(dataSizeToFormat) + " MB";
        }

        // check kilobytes
        dataSizeToFormat = dataSize / BYTES_IN_KILOBYTE;
        if (dataSizeToFormat > 1) {
            return format.format(dataSizeToFormat) + " KB";
        }

        // default to bytes
        return format.format(dataSize) + " bytes";
    }

    /**
     * Returns a time duration in the requested {@link TimeUnit} after parsing the {@code String}
     * input. If the resulting value is a decimal (i.e.
     * {@code 25 hours -> TimeUnit.DAYS = 1.04}), the value is rounded.
     * Use {@link #getPreciseTimeDuration(String, TimeUnit)} if fractional values are desirable
     *
     * @param value the raw String input (i.e. "28 minutes")
     * @param desiredUnit the requested output {@link TimeUnit}
     * @return the whole number value of this duration in the requested units
     * @see #getPreciseTimeDuration(String, TimeUnit)
     */
    public static long getTimeDuration(final String value, final TimeUnit desiredUnit) {
        return Math.round(getPreciseTimeDuration(value, desiredUnit));
    }

    /**
     * Returns the parsed and converted input in the requested units.
     * 

* If the value is {@code 0 <= x < 1} in the provided units, the units will first be converted to a smaller unit to get a value >= 1 (i.e. 0.5 seconds -> 500 milliseconds). * This is because the underlying unit conversion cannot handle decimal values. *

* If the value is {@code x >= 1} but x is not a whole number, the units will first be converted to a smaller unit to attempt to get a whole number value (i.e. 1.5 seconds -> 1500 milliseconds). *

* If the value is {@code x < 1000} and the units are {@code TimeUnit.NANOSECONDS}, the result will be a whole number of nanoseconds, rounded (i.e. 123.4 ns -> 123 ns). *

* This method handles decimal values over {@code 1 ns}, but {@code < 1 ns} will return {@code 0} in any other unit. *

* Examples: *

* "10 seconds", {@code TimeUnit.MILLISECONDS} -> 10_000.0 * "0.010 s", {@code TimeUnit.MILLISECONDS} -> 10.0 * "0.010 s", {@code TimeUnit.SECONDS} -> 0.010 * "0.010 ns", {@code TimeUnit.NANOSECONDS} -> 1 * "0.010 ns", {@code TimeUnit.MICROSECONDS} -> 0 * * @param value the {@code String} input * @param desiredUnit the desired output {@link TimeUnit} * @return the parsed and converted amount (without a unit) */ public static double getPreciseTimeDuration(final String value, final TimeUnit desiredUnit) { final Matcher matcher = TIME_DURATION_PATTERN.matcher(value.toLowerCase()); if (!matcher.matches()) { throw new IllegalArgumentException("Value '" + value + "' is not a valid time duration"); } final String duration = matcher.group(1); final String units = matcher.group(2); double durationVal = Double.parseDouble(duration); TimeUnit specifiedTimeUnit; // The TimeUnit enum doesn't have a value for WEEKS, so handle this case independently if (isWeek(units)) { specifiedTimeUnit = TimeUnit.DAYS; durationVal *= 7; } else { specifiedTimeUnit = determineTimeUnit(units); } // The units are now guaranteed to be in DAYS or smaller long durationLong; if (durationVal == Math.rint(durationVal)) { durationLong = Math.round(durationVal); } else { // Try reducing the size of the units to make the input a long List wholeResults = makeWholeNumberTime(durationVal, specifiedTimeUnit); durationLong = (long) wholeResults.get(0); specifiedTimeUnit = (TimeUnit) wholeResults.get(1); } return desiredUnit.convert(durationLong, specifiedTimeUnit); } /** * Converts the provided time duration value to one that can be represented as a whole number. * Returns a {@code List} containing the new value as a {@code long} at index 0 and the * {@link TimeUnit} at index 1. If the incoming value is already whole, it is returned as is. * If the incoming value cannot be made whole, a whole approximation is returned. For values * {@code >= 1 TimeUnit.NANOSECONDS}, the value is rounded (i.e. 123.4 ns -> 123 ns). * For values {@code < 1 TimeUnit.NANOSECONDS}, the constant [1L, {@code TimeUnit.NANOSECONDS}] is returned as the smallest measurable unit of time. *

* Examples: *

* 1, {@code TimeUnit.SECONDS} -> [1, {@code TimeUnit.SECONDS}] * 1.1, {@code TimeUnit.SECONDS} -> [1100, {@code TimeUnit.MILLISECONDS}] * 0.1, {@code TimeUnit.SECONDS} -> [100, {@code TimeUnit.MILLISECONDS}] * 0.1, {@code TimeUnit.NANOSECONDS} -> [1, {@code TimeUnit.NANOSECONDS}] * * @param decimal the time duration as a decimal * @param timeUnit the current time unit * @return the time duration as a whole number ({@code long}) and the smaller time unit used */ protected static List makeWholeNumberTime(double decimal, TimeUnit timeUnit) { // If the value is already a whole number, return it and the current time unit if (decimal == Math.rint(decimal)) { return Arrays.asList((long) decimal, timeUnit); } else if (TimeUnit.NANOSECONDS == timeUnit) { // The time unit is as small as possible if (decimal < 1.0) { decimal = 1; } else { decimal = Math.rint(decimal); } return Arrays.asList((long) decimal, timeUnit); } else { // Determine the next time unit and the respective multiplier TimeUnit smallerTimeUnit = getSmallerTimeUnit(timeUnit); long multiplier = calculateMultiplier(timeUnit, smallerTimeUnit); // Recurse with the original number converted to the smaller unit return makeWholeNumberTime(decimal * multiplier, smallerTimeUnit); } } /** * Returns the numerical multiplier to convert a value from {@code originalTimeUnit} to * {@code newTimeUnit} (i.e. for {@code TimeUnit.DAYS -> TimeUnit.MINUTES} would return * 24 * 60 = 1440). If the original and new units are the same, returns 1. If the new unit * is larger than the original (i.e. the result would be less than 1), throws an * {@link IllegalArgumentException}. * * @param originalTimeUnit the source time unit * @param newTimeUnit the destination time unit * @return the numerical multiplier between the units */ protected static long calculateMultiplier(TimeUnit originalTimeUnit, TimeUnit newTimeUnit) { if (originalTimeUnit == newTimeUnit) { return 1; } else if (originalTimeUnit.ordinal() < newTimeUnit.ordinal()) { throw new IllegalArgumentException("The original time unit '" + originalTimeUnit + "' must be larger than the new time unit '" + newTimeUnit + "'"); } else { int originalOrd = originalTimeUnit.ordinal(); int newOrd = newTimeUnit.ordinal(); List unitMultipliers = TIME_UNIT_MULTIPLIERS.subList(newOrd, originalOrd); return unitMultipliers.stream().reduce(1L, (a, b) -> (long) a * b); } } /** * Returns the next smallest {@link TimeUnit} (i.e. {@code TimeUnit.DAYS -> TimeUnit.HOURS}). * If the parameter is {@code null} or {@code TimeUnit.NANOSECONDS}, an * {@link IllegalArgumentException} is thrown because there is no valid smaller TimeUnit. * * @param originalUnit the TimeUnit * @return the next smaller TimeUnit */ protected static TimeUnit getSmallerTimeUnit(TimeUnit originalUnit) { if (originalUnit == null || TimeUnit.NANOSECONDS == originalUnit) { throw new IllegalArgumentException("Cannot determine a smaller time unit than '" + originalUnit + "'"); } else { return TimeUnit.values()[originalUnit.ordinal() - 1]; } } /** * Returns {@code true} if this raw unit {@code String} is parsed as representing "weeks", which does not have a value in the {@link TimeUnit} enum. * * @param rawUnit the String containing the desired unit * @return true if the unit is "weeks"; false otherwise */ protected static boolean isWeek(final String rawUnit) { switch (rawUnit) { case "w": case "wk": case "wks": case "week": case "weeks": return true; default: return false; } } /** * Returns the {@link TimeUnit} enum that maps to the provided raw {@code String} input. The * highest time unit is {@code TimeUnit.DAYS}. Any input that cannot be parsed will result in * an {@link IllegalArgumentException}. * * @param rawUnit the String to parse * @return the TimeUnit */ protected static TimeUnit determineTimeUnit(String rawUnit) { switch (rawUnit.toLowerCase()) { case "ns": case "nano": case "nanos": case "nanoseconds": return TimeUnit.NANOSECONDS; case "µs": case "micro": case "micros": case "microseconds": return TimeUnit.MICROSECONDS; case "ms": case "milli": case "millis": case "milliseconds": return TimeUnit.MILLISECONDS; case "s": case "sec": case "secs": case "second": case "seconds": return TimeUnit.SECONDS; case "m": case "min": case "mins": case "minute": case "minutes": return TimeUnit.MINUTES; case "h": case "hr": case "hrs": case "hour": case "hours": return TimeUnit.HOURS; case "d": case "day": case "days": return TimeUnit.DAYS; default: throw new IllegalArgumentException("Could not parse '" + rawUnit + "' to TimeUnit"); } } public static String formatUtilization(final double utilization) { return utilization + "%"; } private static String join(final String delimiter, final String... values) { if (values.length == 0) { return ""; } else if (values.length == 1) { return values[0]; } final StringBuilder sb = new StringBuilder(); sb.append(values[0]); for (int i = 1; i < values.length; i++) { sb.append(delimiter).append(values[i]); } return sb.toString(); } /** * Formats nanoseconds in the format: * 3 seconds, 8 millis, 3 nanos - if includeTotalNanos = false, * 3 seconds, 8 millis, 3 nanos (3008000003 nanos) - if includeTotalNanos = true * * @param nanos the number of nanoseconds to format * @param includeTotalNanos whether or not to include the total number of nanoseconds in parentheses in the returned value * @return a human-readable String that is a formatted representation of the given number of nanoseconds. */ public static String formatNanos(final long nanos, final boolean includeTotalNanos) { final StringBuilder sb = new StringBuilder(); final long seconds = nanos >= 1000000000L ? nanos / 1000000000L : 0L; long millis = nanos >= 1000000L ? nanos / 1000000L : 0L; final long nanosLeft = nanos % 1000000L; if (seconds > 0) { sb.append(seconds).append(" seconds"); } if (millis > 0) { if (seconds > 0) { sb.append(", "); millis -= seconds * 1000L; } sb.append(millis).append(" millis"); } if (seconds > 0 || millis > 0) { sb.append(", "); } sb.append(nanosLeft).append(" nanos"); if (includeTotalNanos) { sb.append(" (").append(nanos).append(" nanos)"); } return sb.toString(); } }