All downloads are free. Search and download functionality uses the official Maven repository.

com.github.jscancella.reader.internal.KeyValueReader Maven / Gradle / Ivy

Go to download

This is a software library intended to support the creation, manipulation, and validation of "bags" from the bagit specification. It currently supports version 0.93 through 1.0.

There is a newer version: 5.2
Show newest version
package com.github.jscancella.reader.internal;

import java.io.BufferedReader;
import java.io.IOException;
import java.nio.charset.Charset;
import java.nio.file.Files;
import java.nio.file.Path;
import java.util.AbstractMap.SimpleImmutableEntry;
import java.util.ArrayList;
import java.util.List;
import java.util.ResourceBundle;
import java.util.regex.Pattern;

import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import org.slf4j.helpers.MessageFormatter;

import com.github.jscancella.exceptions.InvalidBagMetadataException;

/**
 * Convenience class for reading key value pairs from a file
 */
public enum KeyValueReader {;//using enum to enforce singleton
  private static final Logger logger = LoggerFactory.getLogger(KeyValueReader.class);
  private static final String INDENTED_LINE_REGEX = "^\\s+.*";
  private static final ResourceBundle messages = ResourceBundle.getBundle("MessageBundle");
  private static final int PARSED_LINE_LENGTH = 2; //since it is key: value there should only be two items per line after parsing

  /**
   * Generic method to read key value pairs from the bagit files, like bagit.txt or bag-info.txt
   * 
   * @param file the file to read
   * @param splitRegex how to split the key from the value
   * @param charset the encoding of the file
   * 
   * @return a list of key value pairs
   * 
   * @throws IOException if there was a problem reading the file
   * @throws InvalidBagMetadataException if the file does not conform to pattern of key value
   */
  @SuppressWarnings("PMD.AvoidInstantiatingObjectsInLoops")
  public static List> 
    readKeyValuesFromFile(final Path file, final String splitRegex, final Charset charset) throws IOException{
    
    final List> keyValues = new ArrayList<>();
    
    try(BufferedReader reader = Files.newBufferedReader(file, charset)){
      String line = reader.readLine();
      while(line != null){
        if(line.matches(INDENTED_LINE_REGEX) && !keyValues.isEmpty()){
          mergeIndentedLine(line, keyValues);
        }
        else{
          final String[] parts = checkLineFormat(line, splitRegex);
          final String key = parts[0].trim();
          final String value = parts[1].trim();
          logger.debug(messages.getString("read_key_value_line"), key, value, file, splitRegex);
          keyValues.add(new SimpleImmutableEntry<>(key, value));
        }
         
        line = reader.readLine();
      }
    }
    
    return keyValues;
  }
  
  /*
   * If a line is indented, it actually belongs with the previous line so we need to merge them together
   */
  private static void mergeIndentedLine(final String line, final List> keyValues){
    final SimpleImmutableEntry oldKeyValue = keyValues.remove(keyValues.size() -1);
    final SimpleImmutableEntry newKeyValue = new SimpleImmutableEntry<>(oldKeyValue.getKey(), oldKeyValue.getValue() + System.lineSeparator() +line);
    keyValues.add(newKeyValue);
    
    logger.debug(messages.getString("found_indented_line"), oldKeyValue.getKey());
  }
  
  private static String[] checkLineFormat(final String line, final String splitRegex){
    final String[] parts = line.split(splitRegex, PARSED_LINE_LENGTH);
    
    if(parts.length != PARSED_LINE_LENGTH){
      final String formattedMessage = messages.getString("malformed_key_value_line_error");
      throw new InvalidBagMetadataException(MessageFormatter.format(formattedMessage, line, splitRegex).getMessage());
    }
    
    return parts;
  }
}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy