![JAR search and dependency download from the Maven repository](/logo.png)
net.dankito.readability4j.extended.Readability4JExtended.kt Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of Readability4J Show documentation
Show all versions of Readability4J Show documentation
A Kotlin port of Mozilla's Readability. It extracts a website's relevant content and removes all clutter from it.
The newest version!
package net.dankito.readability4j.extended
import net.dankito.readability4j.Readability4J
import net.dankito.readability4j.extended.processor.ArticleGrabberExtended
import net.dankito.readability4j.extended.processor.PostprocessorExtended
import net.dankito.readability4j.extended.util.RegExUtilExtended
import net.dankito.readability4j.model.ReadabilityOptions
import net.dankito.readability4j.processor.MetadataParser
import net.dankito.readability4j.processor.Preprocessor
import org.jsoup.Jsoup
import org.jsoup.nodes.Document
/**
 * A [Readability4J] subclass whose constructors default to the "extended" collaborators:
 * [RegExUtilExtended], [ArticleGrabberExtended] and [PostprocessorExtended].
 *
 * The class declares no members of its own; it only wires these defaults into the
 * superclass constructor.
 */
open class Readability4JExtended : Readability4J {

    // for Java interoperability
    /**
     * Short overload taking raw HTML. Delegates to the HTML-based constructor below,
     * passing a freshly created [ReadabilityOptions] and leaving every other
     * collaborator at its default.
     */
    constructor(uri: String, html: String) : this(uri, html, ReadabilityOptions())

    /**
     * Builds the instance from raw HTML. The markup is parsed via `Jsoup.parse(html, uri)`
     * and the resulting [Document] is forwarded, together with all other arguments,
     * to the [Document]-based constructor.
     */
    constructor(
        uri: String,
        html: String,
        options: ReadabilityOptions = ReadabilityOptions(),
        regExUtil: RegExUtilExtended = RegExUtilExtended(),
        preprocessor: Preprocessor = Preprocessor(regExUtil),
        metadataParser: MetadataParser = MetadataParser(regExUtil),
        articleGrabber: ArticleGrabberExtended = ArticleGrabberExtended(options, regExUtil),
        postprocessor: PostprocessorExtended = PostprocessorExtended()
    ) : this(
        uri = uri,
        document = Jsoup.parse(html, uri),
        options = options,
        regExUtil = regExUtil,
        preprocessor = preprocessor,
        metadataParser = metadataParser,
        articleGrabber = articleGrabber,
        postprocessor = postprocessor
    )

    // for Java interoperability
    /**
     * Short overload taking an already parsed [Document]. Delegates to the
     * [Document]-based constructor below, passing a freshly created [ReadabilityOptions]
     * and leaving every other collaborator at its default.
     */
    constructor(uri: String, document: Document) : this(uri, document, ReadabilityOptions())

    /**
     * Builds the instance from an already parsed [Document]. All arguments are handed
     * unchanged, in declaration order, to the [Readability4J] superclass constructor.
     *
     * Note that [preprocessor], [metadataParser] and [articleGrabber] defaults are created
     * from the [regExUtil] (and, for the article grabber, the [options]) given to this call.
     */
    constructor(
        uri: String,
        document: Document,
        options: ReadabilityOptions = ReadabilityOptions(),
        regExUtil: RegExUtilExtended = RegExUtilExtended(),
        preprocessor: Preprocessor = Preprocessor(regExUtil),
        metadataParser: MetadataParser = MetadataParser(regExUtil),
        articleGrabber: ArticleGrabberExtended = ArticleGrabberExtended(options, regExUtil),
        postprocessor: PostprocessorExtended = PostprocessorExtended()
    ) : super(uri, document, options, regExUtil, preprocessor, metadataParser, articleGrabber, postprocessor)
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy