All downloads are free. Search and download functionality uses the official Maven repository.

net.dankito.readability4j.Article.kt Maven / Gradle / Ivy

Go to download

A Kotlin port of Mozilla's Readability. It extracts a website's relevant content and removes all clutter from it.

The newest version!
package net.dankito.readability4j

import org.jsoup.nodes.Element


/**
 * Holds the outcome of an article extraction: the source [uri], the element
 * with the processed content ([articleContent]) and the metadata describing it.
 *
 * [content], [textContent] and [length] are computed from [articleContent] on
 * every access; they are not stored separately.
 */
open class Article(

    /**
     * Original uri that was passed to the constructor
     */
    val uri: String

) {

    /**
     * Article title
     */
    var title: String? = null

    /**
     * Element holding the processed article content.
     * While it is `null`, [content] and [textContent] are `null` and [length] is `-1`.
     */
    var articleContent: Element? = null

    /**
     * HTML string of processed article content, or `null` if [articleContent] is not set
     */
    val content: String?
        get() = articleContent?.html() // TODO: but this removes paging information (pages in top node)

    /**
     * Text of processed article content as returned by [Element.text],
     * or `null` if [articleContent] is not set
     */
    val textContent: String?
        get() = articleContent?.text()

    /**
     * Length of article, in characters; `-1` if there is no [textContent].
     *
     * The getter always derives the value from [textContent] and never reads the
     * backing field, so a value assigned to this property is not returned on read.
     * The property stays a `var` so that existing callers that assign to it still compile.
     */
    var length: Int = -1
        get() = textContent?.length ?: -1

    /**
     * Article description, or short excerpt from content
     */
    var excerpt: String? = null

    /**
     * Author metadata
     */
    var byline: String? = null

    /**
     * Content direction
     */
    var dir: String? = null

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy