All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.mycore.datamodel.language.MCRLanguageFactory Maven / Gradle / Ivy

There is a newer version: 2024.05
Show newest version
/*
 * This file is part of ***  M y C o R e  ***
 * See http://www.mycore.de/ for details.
 *
 * MyCoRe is free software: you can redistribute it and/or modify
 * it under the terms of the GNU General Public License as published by
 * the Free Software Foundation, either version 3 of the License, or
 * (at your option) any later version.
 *
 * MyCoRe is distributed in the hope that it will be useful,
 * but WITHOUT ANY WARRANTY; without even the implied warranty of
 * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
 * GNU General Public License for more details.
 *
 * You should have received a copy of the GNU General Public License
 * along with MyCoRe.  If not, see .
 */

package org.mycore.datamodel.language;

import java.util.Arrays;
import java.util.HashMap;
import java.util.Locale;
import java.util.Map;

import org.apache.logging.log4j.LogManager;
import org.apache.logging.log4j.Logger;
import org.mycore.backend.hibernate.MCRHIBConnection;
import org.mycore.common.MCRConstants;
import org.mycore.common.MCRSession;
import org.mycore.common.MCRSessionMgr;
import org.mycore.common.config.MCRConfiguration2;
import org.mycore.datamodel.classifications2.MCRCategory;
import org.mycore.datamodel.classifications2.MCRCategoryDAO;
import org.mycore.datamodel.classifications2.MCRCategoryDAOFactory;
import org.mycore.datamodel.classifications2.MCRCategoryID;
import org.mycore.datamodel.classifications2.MCRLabel;

/**
 * Returns MCRLanguage instances. The languages most commonly used, English and German,
 * are provided as constants. Other languages are read from a classification thats ID can be
 * configured using the property "MCR.LanguageClassification". That classification should use
 * ISO 639-1 code as category ID, where ISO 639-2 codes can be added by extra labels x-term and x-bibl
 * for the category. Unknown languages are created by code as required, but a warning is logged.
 *
 * @author Frank L\u00FCtzenkirchen
 */
public class MCRLanguageFactory {
    private static final Logger LOGGER = LogManager.getLogger();

    private static final MCRLanguageFactory SINGLETON = new MCRLanguageFactory();

    public static final MCRLanguage GERMAN = MCRLanguageFactory.instance().getLanguage("de");

    public static final MCRLanguage ENGLISH = MCRLanguageFactory.instance().getLanguage("en");

    /**
     * Map of languages by ISO 639-1 or -2 code
     */
    private Map languageByCode = new HashMap<>();

    /**
     * The ID of the classification containing the language codes and labels
     */
    private MCRCategoryID classification;

    private MCRCategoryDAO categoryDAO = MCRCategoryDAOFactory.getInstance();

    /**
     * Language classification may change at runtime, so we remember the time we last read the languages in.
     */
    private long classificationLastRead = Long.MIN_VALUE;

    /**
     * The default language is configured via "MCR.Metadata.DefaultLang"
     */
    private String codeOfDefaultLanguage;

    private MCRLanguageFactory() {
        codeOfDefaultLanguage = MCRConfiguration2.getString("MCR.Metadata.DefaultLang")
            .orElse(MCRConstants.DEFAULT_LANG);
        initDefaultLanguages();

        classification = MCRConfiguration2.getString("MCR.LanguageClassification")
            .map(MCRCategoryID::rootID)
            .orElse(null);
    }

    /**
     * Returns the MCRLanguageFactory singleton
     */
    public static MCRLanguageFactory instance() {
        return SINGLETON;
    }

    /**
     * Returns the default language, as configured by "MCR.Metadata.DefaultLang"
     */
    public MCRLanguage getDefaultLanguage() {
        return getLanguage(codeOfDefaultLanguage);
    }

    /**
     * Returns the language with the given ISO 639-1 or -2 code. When the given code contains a
     * subcode like "en-us", and the main language is configured, that main language is returned.
     * When the given code does not match any language configured, a language is created on-the-fly,
     * but a warning is logged.
     */
    public MCRLanguage getLanguage(String code) {
        if (classificationHasChanged()) {
            initLanguages();
        }

        return lookupLanguage(code);
    }

    private MCRLanguage lookupLanguage(String code) {
        if ((!languageByCode.containsKey(code)) && code.contains("-") && !code.startsWith("x-")) {
            code = code.split("-")[0];
        }

        if (!languageByCode.containsKey(code)) {
            LOGGER.warn("Unknown language: {}", code);
            buildLanguage(code, code.length() > 2 ? code : null, null);
        }

        return languageByCode.get(code);
    }

    /**
     * This method check the language string base on RFC 1766 to the supported
     * languages in MyCoRe in a current application environment. Without appending
     * this MCRLanguageFactory only ENGLISH and GERMAN are supported.
     *
     * @param code
     *            the language string in RFC 1766 syntax
     * @return true if the language code is supported. It return true too if the code starts
     *            with x- or i-, otherwise return false;
     */
    public final boolean isSupportedLanguage(String code) {
        if (code == null) {
            return false;
        }
        code = code.trim();
        if (code.length() == 0) {
            return false;
        }
        if (code.startsWith("x-") || code.startsWith("i-")) {
            return true;
        }
        return languageByCode.containsKey(code);
    }

    /**
     * Checks if any classification has changed in the persistent store, so that the languages
     * should be read again.
     */
    private boolean classificationHasChanged() {
        return MCRHIBConnection.isEnabled() && (classification != null)
            && (categoryDAO.getLastModified() > classificationLastRead);
    }

    /**
     * Builds the default languages and reads in the languages configured by classification
     */
    private void initLanguages() {
        languageByCode.clear();
        initDefaultLanguages();
        readLanguageClassification();
    }

    /**
     * Builds the default languages
     */
    private void initDefaultLanguages() {
        MCRLanguage de = buildLanguage("de", "deu", "ger");
        MCRLanguage en = buildLanguage("en", "eng", null);
        de.setLabel(de, "Deutsch");
        de.setLabel(en, "German");
        en.setLabel(de, "Englisch");
        en.setLabel(en, "English");
    }

    /**
     * Builds a new language object with the given ISO codes.
     *
     * @param xmlCode ISO 639-1 code as used for xml:lang
     * @param termCode ISO 639-2 terminologic code, may be null
     * @param biblCode ISO 639-2 bibliographical code, may be null
     */
    private MCRLanguage buildLanguage(String xmlCode, String termCode, String biblCode) {
        MCRLanguage language = new MCRLanguage();
        addCode(language, MCRLanguageCodeType.xmlCode, xmlCode);
        if (termCode != null) {
            addCode(language, MCRLanguageCodeType.termCode, termCode);
            addCode(language, MCRLanguageCodeType.biblCode, biblCode == null ? termCode : biblCode);
        }
        Locale locale = Arrays.stream(Locale.getAvailableLocales())
            .filter(l -> l.toString().equals(xmlCode))
            .findFirst()
            .orElseGet(() -> {
                String[] codeParts = xmlCode.split("_");
                switch (codeParts.length) {
                    case 1:
                        return new Locale(codeParts[0]);
                    case 2:
                        return new Locale(codeParts[0], codeParts[1]);
                    default:
                        return new Locale(codeParts[0], codeParts[1], codeParts[2]);
                }

            });
        language.setLocale(locale);
        return language;
    }

    /**
     * Adds and registers the code for the language
     */
    private void addCode(MCRLanguage language, MCRLanguageCodeType type, String code) {
        language.setCode(type, code);
        languageByCode.put(code, language);
    }

    /**
     * Reads in the language classification and builds language objects from its categories
     */
    private void readLanguageClassification() {
        MCRSession session = MCRSessionMgr.getCurrentSession();
        if (!session.isTransactionActive()) {
            session.beginTransaction();
            buildLanguagesFromClassification();
            session.commitTransaction();
        } else {
            buildLanguagesFromClassification();
        }
    }

    /**
     * Builds language objects from classification categories
     */
    private void buildLanguagesFromClassification() {
        this.classificationLastRead = categoryDAO.getLastModified();

        MCRCategory root = categoryDAO.getCategory(classification, -1);
        if (root == null) {
            LOGGER.warn("Language classification {} not found", classification.getRootID());
            return;
        }

        for (MCRCategory category : root.getChildren()) {
            buildLanguage(category);
        }
    }

    /**
     * Builds a new language object from the given category
     */
    private void buildLanguage(MCRCategory category) {
        String xmlCode = category.getId().getID();
        String termCode = category.getLabel("x-term").map(MCRLabel::getText).orElse(null);
        String biblCode = category.getLabel("x-bibl").map(MCRLabel::getText).orElse(termCode);

        MCRLanguage language = buildLanguage(xmlCode, termCode, biblCode);

        category
            .getLabels()
            .stream()
            .filter(l -> !l.getLang().startsWith("x-"))
            .sequential() //MCRLanguage is not thread safe
            .forEach(l -> {
                MCRLanguage languageOfLabel = lookupLanguage(l.getLang());
                language.setLabel(languageOfLabel, l.getText());
            });
    }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy