All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.jpedal.examples.viewer.commands.javafx.JavaFXExtractText Maven / Gradle / Ivy

There is a newer version: 7.15.25
Show newest version
/*
 * ===========================================
 * Java Pdf Extraction Decoding Access Library
 * ===========================================
 *
 * Project Info:  http://www.idrsolutions.com
 * Help section for developers at http://www.idrsolutions.com/support/
 *
 * (C) Copyright 1997-2017 IDRsolutions and Contributors.
 *
 * This file is part of JPedal/JPDF2HTML5
 *
 @LICENSE@
 *
 * ---------------
 * JavaFXExtractText.java
 * ---------------
 */
package org.jpedal.examples.viewer.commands.javafx;

import javafx.beans.value.ChangeListener;
import javafx.beans.value.ObservableValue;
import javafx.css.Styleable;
import javafx.event.ActionEvent;
import javafx.event.EventHandler;
import javafx.geometry.Insets;
import javafx.geometry.Pos;
import javafx.scene.Scene;
import javafx.scene.control.*;
import javafx.scene.layout.*;
import javafx.stage.Modality;
import javafx.stage.Stage;
import org.jpedal.PdfDecoderInt;
import org.jpedal.examples.viewer.Values;
import org.jpedal.examples.viewer.commands.generic.GUICopy;
import org.jpedal.examples.viewer.commands.generic.GUIExtractText;
import org.jpedal.examples.viewer.gui.javafx.dialog.FXDialog;
import org.jpedal.examples.viewer.gui.javafx.dialog.FXMessageDialog;
import org.jpedal.gui.GUIFactory;
import org.jpedal.objects.PdfPageData;
import org.jpedal.utils.Messages;

/**
 * Class to Handle the popup dialogs created when user right clicks
 * highlighted text and chooses text extraction.
 */
public class JavaFXExtractText extends GUIExtractText {

    public static void execute(final Object[] args, final GUIFactory currentGUI, final PdfDecoderInt decode_pdf, final Values commonValues) {
        if (args == null) {
            extractSelectedText(currentGUI, decode_pdf, commonValues);
        } else {

        }
    }

    /**
     * routine to link GUI into text extraction functions
     */
    private static void extractSelectedText(final GUIFactory currentGUI, final PdfDecoderInt decode_pdf, final Values commonValues) {

        if (!decode_pdf.isExtractionAllowed()) {
            currentGUI.showMessageDialog("Not allowed");
            return;
        }

        final int[][] highlights = decode_pdf.getTextLines().getHighlightedAreasAs2DArray(commonValues.getCurrentPage());

        if (highlights == null) {
            currentGUI.showMessageDialog("There is no text selected.\nPlease highlight the text you wish to extract.", "No Text selected", FXMessageDialog.ERROR_MESSAGE);

            return;
        }

        final BorderPane border = new BorderPane();
        final FXDialog textExtractionOptions = new FXDialog((Stage) currentGUI.getFrame(), Modality.APPLICATION_MODAL, border, 300, 300);
        textExtractionOptions.setTitle("Text Extraction Options");

        //Set up Radiobuttons
        final HBox radButtons = new HBox();
        final RadioButton rectangle = new RadioButton("Rectangle");
        rectangle.setId("rectangleExtraction");
        final RadioButton table = new RadioButton("Table");
        table.setId("tableExtraction");
        final RadioButton wordList = new RadioButton("WordList");
        wordList.setId("wordListExtraction");
        radButtons.getChildren().addAll(rectangle, table, wordList);

        table.setPadding(new Insets(0, 0, 0, 20));
        wordList.setPadding(new Insets(0, 0, 0, 45));
        border.setTop(radButtons);

        //Set up Selectedtext Area
        final TextArea selection = new TextArea();
        border.setCenter(selection);

        //Setup bottom Radio Buttons and Bottom Buttons
        final VBox allBottom = new VBox();
        final HBox bottomButtons = new HBox(15);
        final HBox bottomRadioButtons = new HBox();
        final RadioButton extractAsXML = new RadioButton("Extract as XML");
        final RadioButton extractAsText = new RadioButton("Extract as Text");
        final Button help = new Button("Help");
        final Button cancel = new Button("Cancel");
        cancel.setOnAction(new EventHandler() {
            @Override
            public void handle(final javafx.event.ActionEvent e) {
                textExtractionOptions.close();
            }
        });
        final Button extractButton = new Button("Extract");
        extractButton.setVisible(true); //currently disabled button until window is coded.
        final Region spacer = new Region();
        HBox.setHgrow(spacer, Priority.ALWAYS);
        bottomRadioButtons.getChildren().addAll(extractAsXML, spacer, extractAsText);
        bottomButtons.setAlignment(Pos.BOTTOM_RIGHT);
        bottomButtons.getChildren().addAll(help, cancel, extractButton);
        allBottom.getChildren().addAll(bottomRadioButtons, bottomButtons);

        extractAsXML.setPadding(new Insets(0, 0, 0, 10));
        extractAsText.setPadding(new Insets(0, 10, 13, 0));
        bottomButtons.setPadding(new Insets(0, 5, 10, 0));

        help.setOnAction(new EventHandler() {
            @Override
            public void handle(final ActionEvent t) {
                currentGUI.showMessageDialog(Messages.getMessage("PdfViewerGroupingInfo.message"));
            }
        });

        //Add format buttons to a toggle group, so only one be selected.
        final ToggleGroup formatGroup = new ToggleGroup();
        rectangle.setSelected(true);
        formatGroup.getToggles().addAll(rectangle, table, wordList);

        final ChangeListener updateSelectionListener = new ChangeListener() {
            @Override
            public void changed(final ObservableValue ov,
                                final Toggle old_toggle, final Toggle new_toggle) {
                selection.setText(updateSelection(formatGroup.getSelectedToggle(), extractAsXML.isSelected(), decode_pdf, commonValues, currentGUI));
            }
        };

        formatGroup.selectedToggleProperty().addListener(updateSelectionListener);

        //Add extraction mode to a toggle group, so only one be selected.
        final ToggleGroup extractionGroup = new ToggleGroup();
        extractAsText.setSelected(true);
        extractionGroup.getToggles().addAll(extractAsXML, extractAsText);

        extractionGroup.selectedToggleProperty().addListener(updateSelectionListener);

        extractButton.setOnAction(new EventHandler() {
            @Override
            public void handle(final ActionEvent t) {
                createExtractionWindow(formatGroup.getSelectedToggle(), extractAsXML.isSelected(), decode_pdf, commonValues, currentGUI);
            }
        });

        selection.setText(updateSelection(formatGroup.getSelectedToggle(), extractAsXML.isSelected(), decode_pdf, commonValues, currentGUI));
        border.setBottom(allBottom);

        BorderPane.setMargin(selection, new Insets(10, 10, 10, 10));
        BorderPane.setMargin(radButtons, new Insets(10, 10, 10, 10));
        BorderPane.setMargin(bottomRadioButtons, new Insets(10, 10, 10, 10));
        BorderPane.setMargin(bottomButtons, new Insets(10, 10, 10, 10));

        textExtractionOptions.show();


    }

    private static String updateSelection(final Toggle selected, final boolean isXML, final PdfDecoderInt decode_pdf, final Values commonValues, final GUIFactory currentGUI) {
        final StringBuilder finalValue = new StringBuilder(""); // Total data extracted so far
        try {

            final PdfPageData page_data = decode_pdf.getPdfPageData();

            final int cropX = page_data.getCropBoxX(commonValues.getCurrentPage());
            final int cropY = page_data.getCropBoxY(commonValues.getCurrentPage());
            final int cropW = page_data.getCropBoxWidth(commonValues.getCurrentPage());
            final int cropH = page_data.getCropBoxHeight(commonValues.getCurrentPage());

            final int[][] highlights = decode_pdf.getTextLines().getHighlightedAreasAs2DArray(commonValues.getCurrentPage());
            if (highlights != null) {
                for (int t = 0; t != highlights.length; t++) {
                    String extractedText = "";
                    if (highlights[t] != null) {

                        highlights[t] = GUICopy.adjustHighlightForExtraction(highlights[t]);

                        int t_x1 = highlights[t][0];
                        int t_x2 = highlights[t][0] + highlights[t][2];
                        int t_y1 = highlights[t][1] + highlights[t][3];
                        int t_y2 = highlights[t][1];

                        if (t_y1 < t_y2) {
                            final int temp = t_y2;
                            t_y2 = t_y1;
                            t_y1 = temp;
                        }

                        if (t_x1 > t_x2) {
                            final int temp = t_x2;
                            t_x2 = t_x1;
                            t_x1 = temp;
                        }

                        if (t_x1 < cropX) {
                            t_x1 = cropX;
                        }
                        if (t_x1 > cropX + cropW) {
                            t_x1 = cropX + cropW;
                        }

                        if (t_x2 < cropX) {
                            t_x2 = cropX;
                        }
                        if (t_x2 > cropX + cropW) {
                            t_x2 = cropX + cropW;
                        }

                        if (t_y1 < cropY) {
                            t_y1 = cropY;
                        }
                        if (t_y1 > cropY + cropH) {
                            t_y1 = cropY + cropH;
                        }

                        if (t_y2 < cropY) {
                            t_y2 = cropY;
                        }
                        if (t_y2 > cropY + cropH) {
                            t_y2 = cropY + cropH;
                        }

                        if ("rectangleExtraction".equals(((Styleable) selected).getId())) {

                            //text extraction
                            extractedText = extractTextRectangle(commonValues, decode_pdf, currentGUI, isXML, t_x1, t_x2, t_y1, t_y2) + ((char) 0x0D) + ((char) 0x0A);
                        } else if ("tableExtraction".equals(((Styleable) selected).getId())) {
                            //text table extraction
                            extractedText = extractTextTable(commonValues, decode_pdf, isXML, t_x1, t_x2, t_y1, t_y2);
                        } else if ("wordListExtraction".equals(((Styleable) selected).getId())) {
                            //text wordlist extraction
                            extractedText = extractTextList(decode_pdf, commonValues, currentGUI, isXML, t_x1, t_x2, t_y1, t_y2);
                        }

                        finalValue.append(extractedText);
                    }
                }
            }
        } catch (final Exception e) {
            e.printStackTrace();
        }

        return finalValue.toString();
    }

    private static void createExtractionWindow(final Toggle selected, final boolean isXML, final PdfDecoderInt decode_pdf, final Values commonValues, final GUIFactory currentGUI) {

        final Stage extractionDialog = new Stage();

        final TextArea ta = new TextArea();

        final Scene scene = new Scene(ta);
        extractionDialog.setTitle("Extracted Text");

        extractionDialog.setScene(scene);

        ta.setText(updateSelection(selected, isXML, decode_pdf, commonValues, currentGUI));

        extractionDialog.show();

    }
}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy