io.spring.nohttp.RegexPredicate Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of nohttp Show documentation
nohttp
The newest version!
/*
 * Copyright 2002-2019 the original author or authors.
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      https://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package io.spring.nohttp;

import java.io.BufferedReader;
import java.io.IOException;
import java.io.InputStream;
import java.io.InputStreamReader;
import java.nio.charset.StandardCharsets;
import java.util.ArrayList;
import java.util.Collections;
import java.util.List;
import java.util.function.Predicate;
import java.util.regex.Pattern;
import java.util.stream.Collectors;

/**
 * An API that is typically used with {@link RegexHttpMatcher} that allows
 * http text using a provided list of {@link Pattern}s.
 *
 * @author Rob Winch
 * @see RegexHttpMatcher
 * @see #createAllowlistFromPatterns(InputStream)
 */
public class RegexPredicate implements Predicate<String> {
	private final List<Pattern> patterns;

	/**
	 * Creates an allowlist with the provided {@link Pattern}s. The list is copied, so
	 * later changes to the supplied list do not affect this instance.
	 * @param patterns the patterns to use. Cannot be null or empty.
	 * @throws IllegalArgumentException if {@code patterns} is null or empty
	 */
	public RegexPredicate(List<Pattern> patterns) {
		if (patterns == null) {
			throw new IllegalArgumentException("patterns cannot be null");
		}
		// Snapshot first and validate the snapshot, so the non-empty guarantee cannot be
		// invalidated by the caller mutating its own list afterwards.
		List<Pattern> snapshot = Collections.unmodifiableList(new ArrayList<>(patterns));
		if (snapshot.isEmpty()) {
			throw new IllegalArgumentException("patterns cannot be empty");
		}
		this.patterns = snapshot;
	}

	/**
	 * Determines if the provided text is allowed.
	 * @param httpText the text to test
	 * @return true if at least one of the patterns matches the entire text, else false
	 */
	@Override
	public boolean test(String httpText) {
		return this.patterns.stream()
				.anyMatch(p -> p.matcher(httpText).matches());
	}

	/**
	 * Creates an instance that uses the default URL allowlist. The allowlist is expected to
	 * be updated in upcoming releases, but generally contains
	 *
	 * <ul>
	 *     <li>localhost</li>
	 *     <li>URLs that use a TLD defined in https://tools.ietf.org/html/rfc2606 (i.e. tld of test, .example, invalid, localhost)</li>
	 *     <li>XML Namespace names (not the locations)</li>
	 *     <li>Java specific URLs that do not work over http. For example, Java Properties
	 *     hard codes using http.</li>
	 * </ul>
	 *
	 * The patterns are read from the {@code allowlist.txt} class path resource that is
	 * resolved relative to this class.
	 *
	 * @return the {@link Predicate} that determines what is allowed
	 * @throws IllegalStateException if the resource cannot be found
	 */
	public static Predicate<String> createDefaultUrlAllowlist() {
		InputStream resource = RegexPredicate.class.getResourceAsStream("allowlist.txt");
		return createAllowlistFromPatterns(resource);
	}

	/**
	 * Creates a {@link Predicate} from an {@link InputStream}.
	 * The format of the {@link InputStream} contains regular expressions of what inputs
	 * should be allowed such that:
	 *
	 * <ul>
	 *     <li>Each line contains a regular expression that should be allowed</li>
	 *     <li>Lines can begin with // to create a comment within the file</li>
	 *     <li>Lines are trimmed for whitespace</li>
	 *     <li>Lines that are empty are ignored</li>
	 * </ul>
	 *
	 * The content is decoded as UTF-8 and the {@link InputStream} is closed once it has
	 * been read.
	 *
	 * An example file can be found below:
	 *
	 * <pre>
	 * // Ignore Maven XML Namespace id of http://maven.apache.org/POM/4.0.0
	 * ^http://maven\.apache\.org/POM/4.0.0$
	 * // Allow Company XML namespace names but not the locations (which end in .xsd)
	 * ^http://mycompany.test/xml/.*(?&lt;!\.(xsd))$
	 * </pre>
	 *
	 * @param resource the {@link InputStream} to read the regular expressions from
	 * @return the {@link Predicate} that determines what is allowed
	 * @throws IllegalStateException if {@code resource} is null
	 * @throws IllegalArgumentException if no regular expressions are found
	 */
	public static Predicate<String> createAllowlistFromPatterns(InputStream resource) {
		List<Pattern> patterns = createPatternsFromInputStream(resource);
		return new RegexPredicate(patterns);
	}

	/**
	 * Creates an instance that uses the default URL allowlist. This simply delegates to
	 * {@link #createDefaultUrlAllowlist()}.
	 *
	 * @return the {@link Predicate} that determines what is allowed
	 * @deprecated Use {@link #createDefaultUrlAllowlist()}
	 */
	@Deprecated
	public static Predicate<String> createDefaultUrlWhitelist() {
		return createDefaultUrlAllowlist();
	}

	/**
	 * Creates a {@link Predicate} from an {@link InputStream}. This simply delegates to
	 * {@link #createAllowlistFromPatterns(InputStream)}, which describes the expected
	 * format.
	 *
	 * @param resource the {@link InputStream} to read the regular expressions from
	 * @return the {@link Predicate} that determines what is allowed
	 * @deprecated Use {@link #createAllowlistFromPatterns(InputStream)}
	 */
	@Deprecated
	public static Predicate<String> createWhitelistFromPatterns(InputStream resource) {
		return createAllowlistFromPatterns(resource);
	}

	/**
	 * Reads an input stream and creates {@link Pattern} from the {@link InputStream} using
	 * the format described in {@link #createAllowlistFromPatterns(InputStream)}
	 * @param resource the resource to load
	 * @return a {@link List} of {@link Pattern}s, one for each line that is neither
	 * empty nor a comment
	 * @throws IllegalStateException if the resource is null or closing it fails
	 */
	private static List<Pattern> createPatternsFromInputStream(InputStream resource) {
		if (resource == null) {
			throw new IllegalStateException("Failed to load allowed from " + resource);
		}
		// Decode explicitly as UTF-8 so the result does not depend on the platform
		// default charset.
		InputStreamReader input = new InputStreamReader(resource, StandardCharsets.UTF_8);

		try (BufferedReader reader = new BufferedReader(input)) {
			// The stream is fully consumed by collect(...) before the reader is closed.
			return reader.lines()
					.map(String::trim)
					.filter(l -> !l.startsWith("//"))
					.filter(l -> l.length() != 0)
					.map(Pattern::compile)
					.collect(Collectors.toList());
		} catch (IOException e) {
			// Only close() can raise IOException here; read failures inside lines()
			// surface as UncheckedIOException and propagate unchanged.
			throw new IllegalStateException(e);
		}

	}
}
    

    

    
            
    
            

    
        
            
                Related Artifacts
                
                     mysql-connector-java mysql
 facebook-messenger com.github.codedrinker
 selenium-java org.seleniumhq.selenium
 instagram-java com.github.sola92
 gson com.google.code.gson
 poi org.apache.poi
 httpclient org.apache.httpcomponents
 json org.json
 facebook-java-api com.google.code.facebook-java-api
 poi-ooxml org.apache.poi
 jackson-databind com.fasterxml.jackson.core
 junit junit
 primefaces org.primefaces
 ojdbc7 com.github.noraui
 jfoenix com.jfoenix
 testng org.testng
 json-simple com.googlecode.json-simple
 selenium-server org.seleniumhq.selenium
 itextpdf com.itextpdf
 spring-core org.springframework
                
            
        
        
            
                Related Groups
                
                     org.springframework
 org.apache.poi
 org.hibernate
 org.springframework.boot
 com.fasterxml.jackson.core
 com.itextpdf
 org.seleniumhq.selenium
 mysql
 org.finos.legend.engine
 org.apache.httpcomponents
 org.apache.logging.log4j
 org.openjfx
 org.apache.commons
 org.json
 com.google.guava
 com.google.zxing
 net.sf.jasperreports
 javax.xml.bind
 ojdbc
 com.google.code.facebook-java-api