com.conveyal.gtfs.loader.Feed Maven / Gradle / Ivy
package com.conveyal.gtfs.loader;
import com.conveyal.gtfs.error.GTFSError;
import com.conveyal.gtfs.error.NewGTFSError;
import com.conveyal.gtfs.error.SQLErrorStorage;
import com.conveyal.gtfs.model.*;
import com.conveyal.gtfs.storage.StorageException;
import com.conveyal.gtfs.validator.*;
import com.google.common.collect.Multimap;
import com.google.common.collect.Multimaps;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;
import javax.sql.DataSource;
import java.sql.Connection;
import java.sql.SQLException;
import java.sql.Statement;
import java.time.DayOfWeek;
import java.time.LocalDate;
import java.util.ArrayList;
import java.util.Arrays;
import java.util.List;
import static com.conveyal.gtfs.error.NewGTFSErrorType.VALIDATOR_FAILED;
/**
* This connects to an SQL RDBMS containing GTFS data and lets you fetch elements out of it.
*/
public class Feed {
private static final Logger LOG = LoggerFactory.getLogger(Feed.class);
private final DataSource dataSource;
// The unique database schema name for this particular feed, including the separator charater (dot).
// This may be the empty string if the feed is stored in the root ("public") schema.
public final String tablePrefix;
public final TableReader agencies;
public final TableReader calendars;
public final TableReader calendarDates;
// public final TableReader fares;
public final TableReader routes;
public final TableReader stops;
public final TableReader trips;
public final TableReader shapePoints;
public final TableReader stopTimes;
/* A place to accumulate errors while the feed is loaded. Tolerate as many errors as possible and keep on loading. */
// TODO remove this and use only NewGTFSErrors in Validators, loaded into a JDBC table
public final List errors = new ArrayList<>();
/**
* Create a feed that reads tables over a JDBC connection. The connection should already be set to the right
* schema within the database.
* @param tablePrefix the unique prefix for the table (may be null for no prefix)
*/
public Feed (DataSource dataSource, String tablePrefix) {
this.dataSource = dataSource;
// Ensure separator dot is present
if (tablePrefix != null && !tablePrefix.endsWith(".")) tablePrefix += ".";
this.tablePrefix = tablePrefix == null ? "" : tablePrefix;
agencies = new JDBCTableReader(Table.AGENCY, dataSource, tablePrefix, EntityPopulator.AGENCY);
// fares = new JDBCTableReader(Table.FARES, dataSource, tablePrefix, EntityPopulator.FARE);
calendars = new JDBCTableReader(Table.CALENDAR, dataSource, tablePrefix, EntityPopulator.CALENDAR);
calendarDates = new JDBCTableReader(Table.CALENDAR_DATES, dataSource, tablePrefix, EntityPopulator.CALENDAR_DATE);
routes = new JDBCTableReader(Table.ROUTES, dataSource, tablePrefix, EntityPopulator.ROUTE);
stops = new JDBCTableReader(Table.STOPS, dataSource, tablePrefix, EntityPopulator.STOP);
trips = new JDBCTableReader(Table.TRIPS, dataSource, tablePrefix, EntityPopulator.TRIP);
shapePoints = new JDBCTableReader(Table.SHAPES, dataSource, tablePrefix, EntityPopulator.SHAPE_POINT);
stopTimes = new JDBCTableReader(Table.STOP_TIMES, dataSource, tablePrefix, EntityPopulator.STOP_TIME);
}
/**
* TODO check whether validation has already occurred, overwrite results.
* TODO allow validation within feed loading process, so the same connection can be used, and we're certain loaded data is 100% visible.
* That would also avoid having to reconnect the error storage to the DB.
*/
public ValidationResult validate () {
long validationStartTime = System.currentTimeMillis();
// Create an empty validation result that will have its fields populated by certain validators.
ValidationResult validationResult = new ValidationResult();
// Error tables should already be present from the initial load.
// Reconnect to the existing error tables.
SQLErrorStorage errorStorage = null;
try {
errorStorage = new SQLErrorStorage(dataSource.getConnection(), tablePrefix, false);
} catch (SQLException e) {
throw new StorageException(e);
}
int errorCountBeforeValidation = errorStorage.getErrorCount();
List feedValidators = Arrays.asList(
new MisplacedStopValidator(this, errorStorage, validationResult),
new DuplicateStopsValidator(this, errorStorage),
new TimeZoneValidator(this, errorStorage),
new NewTripTimesValidator(this, errorStorage),
new NamesValidator(this, errorStorage));
for (FeedValidator feedValidator : feedValidators) {
String validatorName = feedValidator.getClass().getSimpleName();
try {
LOG.info("Running {}.", validatorName);
int errorCountBefore = errorStorage.getErrorCount();
// todo why not just pass the feed and errorstorage in here?
feedValidator.validate();
LOG.info("{} found {} errors.", validatorName, errorStorage.getErrorCount() - errorCountBefore);
} catch (Exception e) {
// store an error if the validator fails
// FIXME: should the exception be stored?
errorStorage.storeError(NewGTFSError.forFeed(VALIDATOR_FAILED, validatorName));
LOG.error("{} failed.", validatorName);
LOG.error(e.toString());
e.printStackTrace();
}
}
// Signal to all validators that validation is complete and allow them to report on results / status.
for (FeedValidator feedValidator : feedValidators) {
feedValidator.complete(validationResult);
}
int totalValidationErrors = errorStorage.getErrorCount() - errorCountBeforeValidation;
LOG.info("Total number of errors found by all validators: {}", totalValidationErrors);
errorStorage.commitAndClose();
long validationEndTime = System.currentTimeMillis();
long totalValidationTime = validationEndTime - validationStartTime;
LOG.info("{} validators completed in {} milliseconds.", feedValidators.size(), totalValidationTime);
// update validation result fields
validationResult.errorCount = totalValidationErrors;
validationResult.validationTime = totalValidationTime;
// FIXME: Validation result date and int[] fields need to be set somewhere.
return validationResult;
}
/**
* @return a JDBC connection to the database underlying this Feed.
*/
public Connection getConnection() throws SQLException {
return dataSource.getConnection();
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy