com.hazelcast.sql.impl.expression.datetime.Formatter Maven / Gradle / Ivy

Go to download

Show more of this group Show more artifacts with this name
Show all versions of hazelcast-sql Show documentation

SQL Parser and Optimizer

There is a newer version: 5.5.0

/*
 * Copyright 2024 Hazelcast Inc.
 *
 * Licensed under the Hazelcast Community License (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 * http://hazelcast.com/hazelcast-community-license
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package com.hazelcast.sql.impl.expression.datetime;

import com.hazelcast.sql.impl.QueryException;

import javax.annotation.Nonnull;
import java.math.BigDecimal;
import java.math.BigInteger;
import java.math.MathContext;
import java.math.RoundingMode;
import java.text.DecimalFormat;
import java.text.DecimalFormatSymbols;
import java.time.DayOfWeek;
import java.time.ZoneOffset;
import java.time.format.DateTimeFormatter;
import java.time.format.TextStyle;
import java.time.temporal.ChronoField;
import java.time.temporal.IsoFields;
import java.time.temporal.JulianFields;
import java.time.temporal.Temporal;
import java.time.temporal.TemporalField;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.Collections;
import java.util.List;
import java.util.Locale;
import java.util.function.BiFunction;
import java.util.regex.Matcher;
import java.util.regex.Pattern;

import static java.time.temporal.WeekFields.ISO;

/**
 *  Date/Time Formatting
 * 
 *  Pattern                      Description
 * 
 {@code HH}, {@code HH12}     hour of day (1–12)
 * 
 {@code HH24}                 hour of day (0–23)
 * 
 {@code MI}                   minute of hour (0–59)
 * 
 {@code SS}                   second of minute (0–59)
 * 
 {@code MS}, {@code FF3}      millisecond (0–999)
 * 
 {@code US}, {@code FF6}      microsecond (0–999999)
 * 
 {@code FF1}                  tenth of second (0–9)
 * 
 {@code FF2}                  hundredth of second (0–99)
 * 
 {@code FF4}                  tenth of a millisecond (0–9999)
 * 
 {@code FF5}                  hundredth of a millisecond (0–99999)
 * 
 {@code SSSS}, {@code SSSSS}  seconds past midnight (0–86399)
 * 
 {@code AM}, {@code am}, {@code PM}, {@code pm}
 *                                       meridiem indicator (without periods)
 * 
 {@code A.M.}, {@code a.m.}, {@code P.M.}, {@code p.m.}
 *                                       meridiem indicator (with periods)
 * 
 {@code Y,YYY}                year of era (4 or more digits) with comma
 * 
 {@code YYYY}                 year of era (4 or more digits)
 * 
 {@code YYY}                  last 3 digits of year of era
 * 
 {@code YY}                   last 2 digits of year of era
 * 
 {@code Y}                    last digit of year of era
 * 
 {@code IYYY}                 ISO 8601 week-numbering year (4 or more digits)
 * 
 {@code IYY}                  last 3 digits of ISO 8601 week-numbering year
 * 
 {@code IY}                   last 2 digits of ISO 8601 week-numbering year
 * 
 {@code I}                    last digit of ISO 8601 week-numbering year
 * 
 {@code BC}, {@code bc}, {@code AD}, {@code ad}
 *                                       era indicator (without periods)
 * 
 {@code B.C.}, {@code b.c.}, {@code A.D.}, {@code a.d.}
 *                                       era indicator (with periods)
 * 
 {@code MONTH}                full uppercase month name (space-padded to 9 chars)
 * 
 {@code Month}                full capitalized month name (space-padded to 9 chars)
 * 
 {@code month}                full lowercase month name (space-padded to 9 chars)
 * 
 {@code MON}                  abbreviated uppercase month name (3 chars in English,
 *                                           localized lengths vary)
 * 
 {@code Mon}                  abbreviated capitalized month name (3 chars in
 *                                           English, localized lengths vary)
 * 
 {@code mon}                  abbreviated lowercase month name (3 chars in English,
 *                                           localized lengths vary)
 * 
 {@code MM}                   month number (1–12)
 * 
 {@code DAY}                  full uppercase day name (space-padded to 9 chars)
 * 
 {@code Day}                  full capitalized day name (space-padded to 9 chars)
 * 
 {@code day}                  full lowercase day name (space-padded to 9 chars)
 * 
 {@code DY}                   abbreviated uppercase day name (3 chars in English,
 *                                           localized lengths vary)
 * 
 {@code Dy}                   abbreviated capitalized day name (3 chars in English,
 *                                           localized lengths vary)
 * 
 {@code dy}                   abbreviated lowercase day name (3 chars in English,
 *                                           localized lengths vary)
 * 
 {@code DDD}                  day of year (1–366)
 * 
 {@code IDDD}                 day of ISO 8601 week-numbering year (1–371; day 1 of
 *                                           the year is Monday of the first ISO week)
 * 
 {@code DD}                   day of month (1–31)
 * 
 {@code D}                    day of the week, Monday (1) to Sunday (7)
 * 
 {@code ID}                   ISO 8601 day of the week, Monday (1) to Sunday (7)
 * 
 {@code W}                    week of month (1–5) (the first week starts on the
 *                                           first day of the month)
 * 
 {@code WW}                   week number of year (1–53) (the first week starts on
 *                                           the first day of the year)
 * 
 {@code IW}                   week number of ISO 8601 week-numbering year (1–53; the
 *                                           first Thursday of the year is in week 1)
 * 
 {@code CC}                   century of era (2 digits) (the twenty-first century
 *                                           starts on 2001-01-01)
 * 
 {@code J}                    Julian Date (integer days since November 24, 4714 BC
 *                                           at local midnight)
 * 
 {@code Q}                    quarter of year (1-4)
 * 
 {@code RY}                   year of era in uppercase Roman numerals
 * 
 {@code ry}                   year of era in lowercase Roman numerals
 * 
 {@code RM}                   month number in uppercase Roman numerals (I–XII)
 * 
 {@code rm}                   month number in lowercase Roman numerals (i–xii)
 * 
 {@code RD}                   day of month in uppercase Roman numerals (I–XXXI)
 * 
 {@code rd}                   day of month in lowercase Roman numerals (i–xxxi)
 * 
 {@code TZ}                   uppercase time-zone abbreviation (e.g. GMT, UTC)
 * 
 {@code tz}                   lowercase time-zone abbreviation (e.g. gmt, utc)
 * 
 {@code TZH}                  time-zone hours (e.g. +3)
 * 
 {@code TZM}                  time-zone minutes (0-59)
 * 
 {@code OF}                   time-zone offset from UTC (e.g. +03:00)
 * 
 *
 * 
 *  Modifier           Description
 * 
 {@code FM} prefix  enable fill mode (suppress padding)
 * 
 {@code TH} suffix  uppercase ordinal number suffix (English only)
 * 
 {@code th} suffix  lowercase ordinal number suffix (English only)
 * 
 *
 * 
 Numeric Formatting
 * 
 *  Pattern             Description
 * 
 {@code 9}           digit position (can be dropped if insignificant)
 * 
 {@code 0}           digit position (will not be dropped, even if insignificant)
 * 
 {@code .} (period)  decimal separator
 * 
 {@code D}           localized decimal separator
 * 
 {@code ,} (comma)   grouping separator
 * 
 {@code G}           localized grouping separator
 * 
 {@code V}           shift specified number of digits (e.g. V99 = x10²)
 * 
 {@code TH}          uppercase ordinal suffix for the integer part (English only)
 * 
 {@code th}          lowercase ordinal suffix for the integer part (English only)
 * 
 {@code EEEE}        exponent for scientific notation (e.g. E+03, x10^+03)
 * 
 {@code eeee}        lowercase exponent for scientific notation (e.g. e+03, x10^+03)
 * 
 {@code RN}          uppercase Roman numeral for the integer part
 * 
 {@code rn}          lowercase Roman numeral for the integer part
 * 
 {@code FM}          enable fill mode (suppress padding)
 * 
 *
 * 
 *  Fixed       Anchored   Description
 * 
 {@code BR}  {@code B}  negative value in angle brackets
 * 
 {@code SG}  {@code S}  sign
 * 
 {@code MI}  {@code M}  minus sign if number is negative
 * 
 {@code PL}  {@code P}  plus sign if number is non-negative
 * 
 {@code CR}  {@code C}  currency symbol or ISO 4217 currency code
 * 
 *
 * 
 Notes 
 *  The format string consists of the integer and fraction parts, which are split at
 *      the first decimal separator, or just after the last digit position, or the end of the
 *      format string depending on availability. The order of processing is right-to-left in the
 *      integer part and left-to-right in the fraction part.
 * 
 If the format string contains {@code EEEE} or {@code eeee} patterns, it is said to be in
 *      the exponential form, in which no overflow is possible unless the number is
 *      infinite. If it contains {@code RN} or {@code rn} patterns and no digit positions, it is in
 *      the Roman form, in which there is an overflow unless number ∈ [1, 4000).
 *      Otherwise, the format string is in the normal form, in which the number overflows
 *      only if it requires more digit positions than specified for the integer part. In this form,
 *      {@code RN} and {@code rn} patterns format the integer part if |number| < 4000; otherwise,
 *      they switch to the overflow mode.
 * 
 In an overflow, digit positions print a single hash (#), {@code EEEE} and {@code eeee}
 *      patterns print +## as the exponent, {@code RN} and {@code rn} patterns print 15 hashes, and
 *      {@code TH} and {@code th} patterns print 2 spaces if the number is infinite. The other
 *      patterns print what they print when there is no overflow. Note that NaN (not-a-number) is
 *      considered positive.
 * 
 In the normal and exponential forms, if there is no negative sign provision and there is at
 *      least one digit position, an {@code M} pattern is prepended to the integer part. Similarly,
 *      if only one part has {@code BR} and/or {@code B} patterns, the latest bracket in the order
 *      of processing is inserted to the opposite part. The inferred sign is inserted so that it
 *      encloses all non-fixed patterns in the part to which it is inserted. 
 *
 * 
 General Notes 
 *  Lowercase variants of patterns are also accepted. If there is no special meaning of
 *      the lowercase variant, it has the same effect as its uppercase version.
 * 
 {@code FM} pattern enables the fill mode, which suppresses padding.
 *      In date formats: 
 *       If padding is enabled, numeric fields are left-padded with zeros and textual fields are
 *           left-padded with spaces.
 *      
 The padding space is printed immediately, i.e. it is not possible to float the fields
 *           to one side.
 *      
 *      In numeric formats: 
 *       If padding is enabled; {@code 9} pattern prints a single space if it corresponds to a
 *           leading/trailing zero, decimal/grouping separators print a single space if they are
 *           not in between digits, {@code TH} pattern prints 2 spaces if the number is infinite,
 *           {@code RN} pattern pads the Roman numeral to meet 15 characters, {@code BR} pattern
 *           prints 2 spaces if the number is non-negative, and {@code MI}/{@code PL} patterns
 *           print a single space if the number is non-negative/negative respectively.
 *      
 The padding space is not printed until a fixed pattern or the end of
 *           the format string is encountered. As a result, unfixed, or anchored,
 *           patterns float right within the extra space in the integer part and float left in the
 *           fraction part. Digit positions and decimal/grouping separators cannot float for
 *           obvious reasons, but they are considered "transparent" while anchoring other patterns.
 *      
 Zero-padding and space-padding are completely orthogonal, which makes it possible to
 *           have zero-padded fractions, which are aligned at the decimal separator. However, this
 *           requires the last digit of the fraction part to be {@code '0'} if the Postgres
 *           convention is desired. 
 * 
 Consecutive unrecognized characters are interpreted as a literal. It is
 *      also possible to specify a literal by enclosing zero or more characters within double
 *      quotes. If the format string ends before an opening quote is paired, a closing quote is
 *      assumed just after the last character. If a double quote is to be printed, it must be
 *      escaped with a leading backslash. In general, escaping a character causes it to lose its
 *      special meaning if any. In numeric formats, literals are anchored by default. To fix its
 *      position, a literal should be prepended with an {@code F} pattern, e.g. F$, F"USD". 
 */
@SuppressWarnings({"checkstyle:BooleanExpressionComplexity", "checkstyle:CyclomaticComplexity",
        "checkstyle:ExecutableStatementCount", "checkstyle:MagicNumber", "checkstyle:MethodLength",
        "checkstyle:NestedIfDepth", "checkstyle:NPathComplexity"})
public abstract class Formatter {
    /** Regex for a backslash-escaped character. */
    private static final String ESCAPED = "\\\\.";
    /** Regex for a double-quoted literal (closing quote optional) or a single escaped character. */
    private static final String LITERAL = "\"(?:" + ESCAPED + "|[^\"])*\"?|" + ESCAPED;
    /**
     * Regex alternation of the uppercase/capitalized date-time patterns. Alternation is ordered,
     * so a longer pattern must precede any pattern that is its prefix: {@code [WI]W} is listed
     * before {@code W}; otherwise {@code WW} would be tokenized as two {@code W} patterns.
     */
    private static final String DATETIME
            = "SSSSS?|HH(?:12|24)?|MI|[SMU]S|FF[1-6]|[AP](?:M|\\.M\\.)|"
            + "DA?Y|Da?y|I?DDD|DD|I?D|J|[WI]W|W|MON(?:TH)?|Mon(?:th)?|MM|Y,YYY|[YI]Y{0,3}|"
            + "Q|CC|BC|B\\.C\\.|AD|A\\.D\\.|R[DMY]|r[dmy]|TZ[HM]?|TZ|OF";
    /** Regex alternation of the uppercase numeric patterns (digit positions are added separately). */
    private static final String NUMERIC
            = "[,G.D]|FM|BR?|SG?|MI?|PL?|CR?|V9+|TH|EEEE|RN";
    // The lowercase variants are derived with Locale.ROOT: with a default locale such as Turkish,
    // "I" would be lowercased to a dotless "ı" and patterns like "mi" would stop matching.
    /** Group 1: FM/TM prefixes, group 2: pattern, group 3: optional ordinal suffix; or a literal. */
    private static final Pattern DATETIME_TEMPLATE = Pattern.compile(
            "((?:FM|fm|TM|tm)*)(" + DATETIME + "|" + DATETIME.toLowerCase(Locale.ROOT) + ")(TH|th)?|"
            + LITERAL);
    /** Digit groups, numeric patterns in either case, or a literal optionally prefixed by F/f. */
    private static final Pattern NUMERIC_TEMPLATE = Pattern.compile(
            "[90]+|" + NUMERIC + "|" + NUMERIC.toLowerCase(Locale.ROOT) + "|[Ff]?" + LITERAL);
    /** Matches a plus or minus sign. */
    private static final Pattern SIGN = Pattern.compile("[+-]");

    // ARABIC[i] is the value of the Roman symbol ROMAN[i]; both are ordered from largest to smallest.
    private static final int[] ARABIC = {1000,  900, 500,  400, 100,   90,  50,   40,  10,    9,   5,    4,   1};
    private static final String[] ROMAN = {"M", "CM", "D", "CD", "C", "XC", "L", "XL", "X", "IX", "V", "IV", "I"};
    /** English ordinal suffix indexed by the last decimal digit. */
    private static final String[] ORDINAL = {"th", "st", "nd", "rd", "th", "th", "th", "th", "th", "th"};

    /**
     * Creates a formatter for date/time values from the given format string.
     *
     * @param format the date/time format string
     * @return a new {@code DateFormat} built from {@code format}
     */
    public static Formatter forDates(@Nonnull String format) {
        return new DateFormat(format);
    }
    /**
     * Creates a formatter for numeric values from the given format string.
     *
     * @param format the numeric format string
     * @return a new {@code NumberFormat} built from {@code format}
     */
    public static Formatter forNumbers(@Nonnull String format) {
        return new NumberFormat(format);
    }

    /**
     * Formats the input according to the format string this formatter was created with.
     *
     * @param input  the value to format; the date/time formatter requires a {@link Temporal}
     * @param locale the locale passed to locale-sensitive patterns
     * @return the formatted text
     */
    public abstract String format(@Nonnull Object input, @Nonnull Locale locale);

    /** Callback through which {@code parse} reports the pieces of a format string. */
    interface GroupProcessor {
        /** Receives unmatched text and escaped characters, with escapes still in place. */
        void acceptLiteral(String literal);
        /** Receives the text of a template match together with the matcher positioned on it. */
        void acceptGroup(String group, Matcher m);
    }

    /**
     * Tokenizes {@code format} with {@code template} and feeds the tokens to {@code processor}.
     * Text between matches and backslash-escaped characters are accumulated and delivered
     * as a single literal just before the next non-escape match, or at the end of the format.
     *
     * @param template  the pattern whose matches are the recognized tokens
     * @param processor the receiver of literals and matched groups
     * @param format    the format string to tokenize
     */
    private static void parse(Pattern template, GroupProcessor processor, String format) {
        Matcher matcher = template.matcher(format);
        StringBuilder pending = new StringBuilder();
        int consumed = 0;
        while (matcher.find()) {
            int start = matcher.start();
            if (start > consumed) {
                // Unrecognized characters between two matches belong to the pending literal.
                pending.append(format, consumed, start);
            }
            String token = matcher.group();
            if (token.startsWith("\\")) {
                // An escaped character extends the pending literal; it is unescaped later.
                pending.append(token);
            } else {
                if (pending.length() > 0) {
                    processor.acceptLiteral(pending.toString());
                    pending.setLength(0);
                }
                processor.acceptGroup(token, matcher);
            }
            consumed = matcher.end();
        }
        if (consumed < matcher.regionEnd() || pending.length() > 0) {
            processor.acceptLiteral(pending + format.substring(consumed));
        }
    }

    private static > T valueOf(Class type, String name) {
        try {
            return Enum.valueOf(type, name);
        } catch (IllegalArgumentException e) {
            return Enum.valueOf(type, name.toUpperCase());
        }
    }

    /**
     * Strips unescaped double quotes and resolves backslash escapes: a backslash followed by any
     * character yields that character verbatim (including a double quote). A trailing backslash
     * with nothing after it is kept as is.
     */
    private static String unescape(String input) {
        int length = input.length();
        StringBuilder out = new StringBuilder(length);
        int pos = 0;
        while (pos < length) {
            char current = input.charAt(pos++);
            if (current == '"') {
                continue;
            }
            if (current == '\\' && pos < length) {
                current = input.charAt(pos++);
            }
            out.append(current);
        }
        return out.toString();
    }

    /**
     * Converts a number to uppercase Roman numerals. Numbers above 3999 yield 15 hashes;
     * numbers below 1 yield an empty string.
     */
    private static String toRoman(int number) {
        if (number > 3999) {
            char[] overflow = new char[15];
            Arrays.fill(overflow, '#');
            return new String(overflow);
        }
        StringBuilder numeral = new StringBuilder(15);
        int remaining = number;
        for (int i = 0; i < ARABIC.length; i++) {
            // Greedily emit the largest symbol that still fits.
            while (remaining >= ARABIC[i]) {
                numeral.append(ROMAN[i]);
                remaining -= ARABIC[i];
            }
        }
        return numeral.toString();
    }

    /**
     * Returns the lowercase English ordinal suffix for the decimal representation of a number.
     *
     * @param number the text the suffix is appended to
     * @return "st", "nd", "rd" or "th"; an empty string if {@code number} is empty or does not
     *         end with a decimal digit, since there is no ordinal for such text
     */
    private static String getOrdinal(String number) {
        if (number.isEmpty()) {
            return "";
        }
        char last = number.charAt(number.length() - 1);
        if (last < '0' || last > '9') {
            // Previously this indexed ORDINAL out of bounds, e.g. for "January", "XII" or "Z".
            return "";
        }
        if (number.endsWith("11") || number.endsWith("12") || number.endsWith("13")) {
            return "th";
        }
        return ORDINAL[last - '0'];
    }

    /**
     * Date/time formatter. The format string is tokenized once in the constructor into a list of
     * {@link Part}s, which are then applied in order to every input.
     */
    private static class DateFormat extends Formatter {
        static final DateTimeFormatter MERIDIEM_FORMATTER = DateTimeFormatter.ofPattern("a");
        static final DateTimeFormatter TIMEZONE_FORMATTER = DateTimeFormatter.ofPattern("O");
        static final DateTimeFormatter ERA_FORMATTER = DateTimeFormatter.ofPattern("G");

        /** Transforms applied to the textual result of another pattern. */
        static final BiFunction<Object, Locale, Object> UPPERCASE = (o, l) -> ((String) o).toUpperCase(l);
        static final BiFunction<Object, Locale, Object> LOWERCASE = (o, l) -> ((String) o).toLowerCase(l);
        /** Turns a two-letter indicator such as "AM" into "A.M."; other lengths are left untouched. */
        static final BiFunction<Object, Locale, Object> WITH_PERIODS = (o, l) -> {
            String r = (String) o;
            return r.length() != 2 ? r : r.charAt(0) + "." + r.charAt(1) + ".";
        };

        private final List<Part> parts = new ArrayList<>();

        /** A compiled piece of the format string that appends its output to the builder. */
        interface Part {
            void format(StringBuilder s, Temporal input, Locale locale);
        }

        /** Fixed text; quotes and escapes are resolved at construction time. */
        static class Literal implements Part {
            final String contents;

            Literal(String contents) {
                this.contents = unescape(contents);
            }

            @Override
            public void format(StringBuilder s, Temporal input, Locale locale) {
                s.append(contents);
            }

            @Override
            public String toString() {
                return '"' + contents + '"';
            }
        }

        /** A pattern together with its padding flag and optional ordinal suffix. */
        static class PatternInstance implements Part {
            final boolean padding;
            final PatternElement pattern;
            final Ordinal ordinal;

            PatternInstance(boolean padding, PatternElement pattern, Ordinal ordinal) {
                this.padding = padding;
                this.pattern = pattern;
                this.ordinal = ordinal;
            }

            @Override
            public void format(StringBuilder s, Temporal input, Locale locale) {
                Object result = pattern.query.apply(input, locale);
                String r = result.toString();
                if (pattern == PatternElement.TZH) {
                    // The sign is taken from the whole offset, not from the truncated hour count,
                    // so that offsets between -01:00 and 00:00 are still printed as negative.
                    boolean negative = ZoneOffset.from(input).getTotalSeconds() < 0;
                    s.append(negative ? '-' : '+');
                    r = Integer.toString(Math.abs((int) result));
                }
                if (padding) {
                    // Numeric results are zero-padded, textual results are space-padded.
                    char pad = result instanceof Number ? '0' : ' ';
                    for (int i = r.length(); i < pattern.maxLength; i++) {
                        s.append(pad);
                    }
                }
                s.append(r);
                // The thousands separator needs at least 4 printed digits. In fill mode this also
                // covers years with more than 4 digits, which previously lost the comma.
                if (pattern == PatternElement.Y_YYY && (padding || r.length() >= 4)) {
                    s.insert(s.length() - 3, ',');
                }
                // Ordinal suffixes only make sense for numeric results; for names, Roman numerals
                // and offsets the suffix is skipped instead of failing on a non-digit character.
                if (ordinal != null && result instanceof Number) {
                    String th = getOrdinal(r);
                    s.append(ordinal == Ordinal.TH ? th.toUpperCase(Locale.ROOT) : th);
                }
            }

            @Override
            public String toString() {
                return pattern + (ordinal == null ? "" : ordinal.toString());
            }
        }

        /**
         * Supported patterns. Each constant holds a query that extracts its value from the input
         * and the width it is padded to. Constant names are the pattern texts with {@code '.'}
         * and {@code ','} replaced by {@code '_'}.
         */
        @SuppressWarnings("checkstyle:MethodParamPad")
        enum PatternElement {
            HH12  (ChronoField.CLOCK_HOUR_OF_AMPM, 2), HH(HH12),
            HH24  (ChronoField.HOUR_OF_DAY, 2),
            MI    (ChronoField.MINUTE_OF_HOUR, 2),
            SS    (ChronoField.SECOND_OF_MINUTE, 2),
            MS    (ChronoField.MILLI_OF_SECOND, 3),
            US    (ChronoField.MICRO_OF_SECOND, 6),
            FF1   (MS, (r, l) -> (int) r / 100, 1),
            FF2   (MS, (r, l) -> (int) r / 10, 2),
            FF3   (MS),
            FF4   (US, (r, l) -> (int) r / 100, 4),
            FF5   (US, (r, l) -> (int) r / 10, 5),
            FF6   (US),
            SSSS  (ChronoField.SECOND_OF_DAY, 5), SSSSS (SSSS),
            AM    ((t, l) -> MERIDIEM_FORMATTER.withLocale(l).format(t), 2), PM(AM),
            am    (AM, LOWERCASE), pm(am),
            A_M_  (AM, WITH_PERIODS, 4), P_M_(A_M_),
            a_m_  (am, WITH_PERIODS), p_m_(a_m_),
            YYYY  (ChronoField.YEAR_OF_ERA, 4), Y_YYY(YYYY),
            YYY   (YYYY, (r, l) -> (int) r % 1000, 3),
            YY    (YYYY, (r, l) -> (int) r % 100, 2),
            Y     (YYYY, (r, l) -> (int) r % 10, 1),
            IYYY  (ISO.weekBasedYear(), 4),
            IYY   (IYYY, (r, l) -> (int) r % 1000, 3),
            IY    (IYYY, (r, l) -> (int) r % 100, 2),
            I     (IYYY, (r, l) -> (int) r % 10, 1),
            BC    ((t, l) -> ERA_FORMATTER.withLocale(l).format(t), 2), AD(BC),
            bc    (BC, LOWERCASE), ad(bc),
            B_C_  (BC, WITH_PERIODS, 4), A_D_(B_C_),
            b_c_  (bc, WITH_PERIODS), a_d_(b_c_),
            Month ((t, l) -> java.time.Month.from(t).getDisplayName(TextStyle.FULL, l), 9),
            MONTH (Month, UPPERCASE),
            month (Month, LOWERCASE),
            Mon   ((t, l) -> java.time.Month.from(t).getDisplayName(TextStyle.SHORT, l), 3),
            MON   (Mon, UPPERCASE),
            mon   (Mon, LOWERCASE),
            MM    (ChronoField.MONTH_OF_YEAR, 2),
            Day   ((t, l) -> DayOfWeek.from(t).getDisplayName(TextStyle.FULL, l), 9),
            DAY   (Day, UPPERCASE),
            day   (Day, LOWERCASE),
            Dy    ((t, l) -> DayOfWeek.from(t).getDisplayName(TextStyle.SHORT, l), 3),
            DY    (Dy, UPPERCASE),
            dy    (Dy, LOWERCASE),
            DDD   (ChronoField.DAY_OF_YEAR, 3),
            IDDD  ((t, l) -> (t.get(ISO.weekOfWeekBasedYear()) - 1) * 7 + t.get(ISO.dayOfWeek()), 3),
            DD    (ChronoField.DAY_OF_MONTH, 2),
            D     (ChronoField.DAY_OF_WEEK, 1),
            ID    (ISO.dayOfWeek(), 1),
            W     (ChronoField.ALIGNED_WEEK_OF_MONTH, 1),
            WW    (ChronoField.ALIGNED_WEEK_OF_YEAR, 2),
            IW    (ISO.weekOfWeekBasedYear(), 2),
            // Integer ceiling division; avoids the precision loss of float arithmetic.
            CC    ((t, l) -> (t.get(ChronoField.YEAR_OF_ERA) + 99) / 100, 2),
            J     ((t, l) -> t.getLong(JulianFields.JULIAN_DAY), 7),
            Q     (IsoFields.QUARTER_OF_YEAR, 1),
            RY    ((t, l) -> toRoman(t.get(ChronoField.YEAR_OF_ERA)), 15),
            ry    (RY, LOWERCASE),
            RM    ((t, l) -> toRoman(t.get(ChronoField.MONTH_OF_YEAR)), 4),
            rm    (RM, LOWERCASE),
            RD    ((t, l) -> toRoman(t.get(ChronoField.DAY_OF_MONTH)), 6),
            rd    (RD, LOWERCASE),
            TZ    ((t, l) -> SIGN.split(TIMEZONE_FORMATTER.withLocale(l).format(t))[0], 3),
            tz    (TZ, LOWERCASE),
            // Signed hour count; PatternInstance prints the sign separately.
            TZH   ((t, l) -> ZoneOffset.from(t).getTotalSeconds() / 3600, 2),
            // Minutes are printed unsigned (0-59); the sign of the offset belongs to TZH.
            TZM   ((t, l) -> Math.abs(ZoneOffset.from(t).getTotalSeconds() % 3600) / 60, 2),
            OF    ((t, l) -> ZoneOffset.from(t).getId(), 6);

            final BiFunction<Temporal, Locale, Object> query;
            final int maxLength;

            /** Alias of another pattern. */
            PatternElement(PatternElement pattern) {
                this(pattern.query, pattern.maxLength);
            }
            /** Reads a temporal field as an int. */
            PatternElement(TemporalField field, int maxLength) {
                this((t, l) -> t.get(field), maxLength);
            }
            /** Transforms the result of another pattern, keeping its width. */
            PatternElement(PatternElement pattern, BiFunction<Object, Locale, Object> transform) {
                this(pattern, transform, pattern.maxLength);
            }
            /** Transforms the result of another pattern, with its own width. */
            PatternElement(PatternElement pattern, BiFunction<Object, Locale, Object> transform, int maxLength) {
                this((t, l) -> transform.apply(pattern.query.apply(t, l), l), maxLength);
            }
            PatternElement(BiFunction<Temporal, Locale, Object> query, int maxLength) {
                this.query = query;
                this.maxLength = maxLength;
            }
        }

        /** Ordinal suffix modifier: uppercase or lowercase. */
        enum Ordinal { TH, th }

        /** Collects the tokens reported by {@code parse} into {@link #parts}. */
        class DateTimeGroupProcessor implements GroupProcessor {
            @Override
            public void acceptLiteral(String literal) {
                parts.add(new Literal(literal));
            }

            @Override
            public void acceptGroup(String group, Matcher m) {
                if (group.startsWith("\"")) {
                    parts.add(new Literal(group));
                } else {
                    // Group 1: FM/TM prefixes, group 2: pattern, group 3: optional TH/th suffix.
                    String prefix = m.group(1).toUpperCase(Locale.ROOT);
                    String pattern = m.group(2).replace('.', '_').replace(',', '_');
                    String suffix = m.group(3);
                    parts.add(new PatternInstance(!prefix.contains("FM"), valueOf(PatternElement.class, pattern),
                            suffix == null ? null : Ordinal.valueOf(suffix)));
                }
            }
        }

        DateFormat(String format) {
            parse(DATETIME_TEMPLATE, new DateTimeGroupProcessor(), format);
        }

        /**
         * Formats a date/time value by applying every compiled part in order.
         *
         * @throws QueryException if {@code input} is not a {@link Temporal}
         */
        @Override
        public String format(@Nonnull Object input, @Nonnull Locale locale) {
            if (!(input instanceof Temporal)) {
                throw QueryException.dataException("Input parameter is expected to be date/time");
            }
            Temporal temporal = (Temporal) input;
            StringBuilder s = new StringBuilder();
            for (Part part : parts) {
                part.format(s, temporal, locale);
            }
            return s.toString();
        }

        @Override
        public String toString() {
            return parts.toString();
        }
    }

    /**
     * This implementation does not leverage {@link DecimalFormat} or {@link java.util.Formatter}
     * for the following reasons. <ul>
     * <li> {@link DecimalFormat} does not fill the pattern space with #'s when the integer part
     *      overflows. Instead, it truncates the integer part, which cannot be checked without
     *      obtaining its decimal representation.
     * <li> {@link DecimalFormat} does not support multiple grouping sizes and separators.
     * <li> {@link DecimalFormat} rounds the fractional part using its binary representation, which
     *      produces wrong results even for simple cases such as (0.15 → #.# → 0.1) in {@link
     *      RoundingMode#HALF_UP}.
     * <li> {@link java.util.Formatter} does not cache or expose the intermediate representation of
     *      the format string.
     * <li> {@link java.util.Formatter} can correctly handle rounding by leveraging {@link
     *      sun.misc.FormattedFloatingDecimal} for {@link Float} and {@link Double}, and by using
     *      {@link BigDecimal#BigDecimal(BigInteger, int, MathContext) BigDecimal(BigInteger,
     *      scale, precision)}. Both {@link sun.misc.FormattedFloatingDecimal} and {@link
     *      BigDecimal} are using the decimal representation of floating point numbers, but for the
     *      former, the rounding mode is not configurable. </ul>
     */
    private static class NumberFormat extends Formatter {
        // NOTE(review): the code that assigns and reads these fields is outside the visible part
        // of the file; the remarks below are inferred from the names and the class-level notes
        // and should be confirmed against the constructor.
        private final Form form;
        // Presumably the compiled integer and fraction parts of the format string.
        private final Mask integerMask;
        private final Mask fractionMask;
        // Presumably false when an FM (fill mode) pattern is present — confirm.
        private final boolean padding;
        private final boolean currency;
        // Presumably the number of digits given by a V pattern — confirm.
        private final int shift;

        /** The three forms of a numeric format string. */
        enum Form { Normal, Exponential, Roman }

        /** Implemented by mask items that are either anchored or fixed. */
        interface Anchorable {
            /** Returns whether this item is anchored. */
            boolean isAnchored();
        }

        /**
         * Non-digit numeric patterns: signs, currency, ordinals, exponents and Roman numerals.
         * Constants listed in {@link #ANCHORED} are the anchored ones.
         */
        enum PatternElement implements Anchorable {
            BR, B, SG, S, MI, M, PL, P, CR, C, TH, th, EEEE, eeee, RN, rn;

            /** All sign patterns. */
            static final List<PatternElement> SIGN = Arrays.asList(BR, B, SG, S, MI, M, PL, P);
            /** Sign patterns that print something for negative numbers. */
            static final List<PatternElement> NEGATIVE = Arrays.asList(BR, B, SG, S, MI, M);
            /** Patterns reported as anchored by {@link #isAnchored()}. */
            static final List<PatternElement> ANCHORED
                    = Arrays.asList(B, S, M, P, C, TH, th, EEEE, eeee, RN, rn);

            boolean isSign() {
                return SIGN.contains(this);
            }
            boolean isNegativeSign() {
                return NEGATIVE.contains(this);
            }

            /**
             * Returns the character this sign pattern prints.
             *
             * @param pre      selects the opening ({@code '<'}) rather than the closing
             *                 ({@code '>'}) bracket for {@code BR}/{@code B}
             * @param negative whether the number is negative
             * @return the sign character, or a space if the pattern prints no sign for the number
             * @throws IllegalArgumentException if this is not a sign pattern
             */
            char getSign(boolean pre, boolean negative) {
                switch (this) {
                    case BR:
                    case B:
                        return negative ? (pre ? '<' : '>') : ' ';
                    case SG:
                    case S:
                        return negative ? '-' : '+';
                    case MI:
                    case M:
                        return negative ? '-' : ' ';
                    case PL:
                    case P:
                        return negative ? ' ' : '+';
                    default:
                        throw new IllegalArgumentException(this + " is not a sign pattern");
                }
            }

            @Override
            public boolean isAnchored() {
                return ANCHORED.contains(this);
            }
        }

        /**
         * Arbitrary text in a numeric format. A leading {@code F} or {@code f} marks the literal
         * as fixed (not anchored) and is not part of its contents.
         */
        static class Literal implements Anchorable {
            final String contents;
            final boolean anchored;

            Literal(String literal) {
                char first = literal.charAt(0);
                boolean fixed = first == 'F' || first == 'f';
                anchored = !fixed;
                contents = unescape(fixed ? literal.substring(1) : literal);
            }

            @Override
            public boolean isAnchored() {
                return anchored;
            }

            @Override
            public String toString() {
                String prefix = anchored ? "" : "F";
                return prefix + "\"" + contents + "\"";
            }
        }

        /**
         * Stores {@link Literal}, {@link PatternElement}, {@link Character} and {@link Integer}
         * to represent arbitrary text, sign/currency/ordinals/exponent/roman numerals,
         * decimal/grouping separators, and digit groups respectively.
         */
        class Mask {
            final boolean pre;
            final List

Pattern	Description *
{@code HH}, {@code HH12}	hour of day (1–12) *
{@code HH24}	hour of day (0–23) *
{@code MI}	minute of hour (0–59) *
{@code SS}	second of minute (0–59) *
{@code MS}, {@code FF3}	millisecond (0–999) *
{@code US}, {@code FF6}	microsecond (0–999999) *
{@code FF1}	tenth of second (0–9) *
{@code FF2}	hundredth of second (0–99) *
{@code FF4}	tenth of a millisecond (0–9999) *
{@code FF5}	hundredth of a millisecond (0–99999) *
{@code SSSS}, {@code SSSSS}	seconds past midnight (0–86399) *
{@code AM}, {@code am}, {@code PM}, {@code pm} *	meridiem indicator (without periods) *
{@code A.M.}, {@code a.m.}, {@code P.M.}, {@code p.m.} *	meridiem indicator (with periods) *
{@code Y,YYY}	year of era (4 or more digits) with comma *
{@code YYYY}	year of era (4 or more digits) *
{@code YYY}	last 3 digits of year of era *
{@code YY}	last 2 digits of year of era *
{@code Y}	last digit of year of era *
{@code IYYY}	ISO 8601 week-numbering year (4 or more digits) *
{@code IYY}	last 3 digits of ISO 8601 week-numbering year *
{@code IY}	last 2 digits of ISO 8601 week-numbering year *
{@code I}	last digit of ISO 8601 week-numbering year *
{@code BC}, {@code bc}, {@code AD}, {@code ad} *	era indicator (without periods) *
{@code B.C.}, {@code b.c.}, {@code A.D.}, {@code a.d.} *	era indicator (with periods) *
{@code MONTH}	full uppercase month name (space-padded to 9 chars) *
{@code Month}	full capitalized month name (space-padded to 9 chars) *
{@code month}	full lowercase month name (space-padded to 9 chars) *
{@code MON}	abbreviated uppercase month name (3 chars in English, * localized lengths vary) *
{@code Mon}	abbreviated capitalized month name (3 chars in * English, localized lengths vary) *
{@code mon}	abbreviated lowercase month name (3 chars in English, * localized lengths vary) *
{@code MM}	month number (1–12) *
{@code DAY}	full uppercase day name (space-padded to 9 chars) *
{@code Day}	full capitalized day name (space-padded to 9 chars) *
{@code day}	full lowercase day name (space-padded to 9 chars) *
{@code DY}	abbreviated uppercase day name (3 chars in English, * localized lengths vary) *
{@code Dy}	abbreviated capitalized day name (3 chars in English, * localized lengths vary) *
{@code dy}	abbreviated lowercase day name (3 chars in English, * localized lengths vary) *
{@code DDD}	day of year (1–366) *
{@code IDDD}	day of ISO 8601 week-numbering year (1–371; day 1 of * the year is Monday of the first ISO week) *
{@code DD}	day of month (1–31) *
{@code D}	day of the week, Monday (1) to Sunday (7) *
{@code ID}	ISO 8601 day of the week, Monday (1) to Sunday (7) *
{@code W}	week of month (1–5) (the first week starts on the * first day of the month) *
{@code WW}	week number of year (1–53) (the first week starts on * the first day of the year) *
{@code IW}	week number of ISO 8601 week-numbering year (1–53; the * first Thursday of the year is in week 1) *
{@code CC}	century of era (2 digits) (the twenty-first century * starts on 2001-01-01) *
{@code J}	Julian Date (integer days since November 24, 4714 BC * at local midnight) *
{@code Q}	quarter of year (1-4) *
{@code RY}	year of era in uppercase Roman numerals *
{@code ry}	year of era in lowercase Roman numerals *
{@code RM}	month number in uppercase Roman numerals (I–XII) *
{@code rm}	month number in lowercase Roman numerals (i–xii) *
{@code RD}	day of month in uppercase Roman numerals (I–XXXI) *
{@code rd}	day of month in lowercase Roman numerals (i–xxxi) *
{@code TZ}	uppercase time-zone abbreviation (e.g. GMT, UTC) *
{@code tz}	lowercase time-zone abbreviation (e.g. gmt, utc) *
{@code TZH}	time-zone hours (e.g. +3) *
{@code TZM}	time-zone minutes (0-59) *
{@code OF}	time-zone offset from UTC (e.g. +03:00) *

Modifier	Description *
{@code FM} prefix	enable fill mode (suppress padding) *
{@code TH} suffix	uppercase ordinal number suffix (English only) *
{@code th} suffix	lowercase ordinal number suffix (English only) *

Pattern	Description *
{@code 9}	digit position (can be dropped if insignificant) *
{@code 0}	digit position (will not be dropped, even if insignificant) *
{@code .} (period)	decimal separator *
{@code D}	localized decimal separator *
{@code ,} (comma)	grouping separator *
{@code G}	localized grouping separator *
{@code V}	shift specified number of digits (e.g. V99 = x10²) *
{@code TH}	uppercase ordinal suffix for the integer part (English only) *
{@code th}	lowercase ordinal suffix for the integer part (English only) *
{@code EEEE}	exponent for scientific notation (e.g. E+03, x10^+03) *
{@code eeee}	lowercase exponent for scientific notation (e.g. e+03, x10^+03) *
{@code RN}	uppercase Roman numeral for the integer part *
{@code rn}	lowercase Roman numeral for the integer part *
{@code FM}	enable fill mode (suppress padding) *

Fixed	Anchored	Description *
{@code BR}	{@code B}	negative value in angle brackets *
{@code SG}	{@code S}	sign *
{@code MI}	{@code M}	minus sign if number is negative *
{@code PL}	{@code P}	plus sign if number is non-negative *
{@code CR}	{@code C}	currency symbol or ISO 4217 currency code *