org.semanticwb.resource.office.sem.WordResource Maven / Gradle / Ivy

Go to download
Show more of this group Show more artifacts with this name
Show all versions of SWBOffice Show documentation
MS Office plugin implementation for SemanticWebBuilder
The newest version!
/*
 * SemanticWebBuilder es una plataforma para el desarrollo de portales y aplicaciones de integración,
 * colaboración y conocimiento, que gracias al uso de tecnología semántica puede generar contextos de
 * información alrededor de algún tema de interés o bien integrar información y aplicaciones de diferentes
 * fuentes, donde a la información se le asigna un significado, de forma que pueda ser interpretada y
 * procesada por personas y/o sistemas, es una creación original del Fondo de Información y Documentación
 * para la Industria INFOTEC, cuyo registro se encuentra actualmente en trámite.
 *
 * INFOTEC pone a su disposición la herramienta SemanticWebBuilder a través de su licenciamiento abierto al público (‘open source’),
 * en virtud del cual, usted podrá usarlo en las mismas condiciones con que INFOTEC lo ha diseñado y puesto a su disposición;
 * aprender de él; distribuirlo a terceros; acceder a su código fuente y modificarlo, y combinarlo o enlazarlo con otro software,
 * todo ello de conformidad con los términos y condiciones de la LICENCIA ABIERTA AL PÚBLICO que otorga INFOTEC para la utilización
 * del SemanticWebBuilder 4.0.
 *
 * INFOTEC no otorga garantía sobre SemanticWebBuilder, de ninguna especie y naturaleza, ni implícita ni explícita,
 * siendo usted completamente responsable de la utilización que le dé y asumiendo la totalidad de los riesgos que puedan derivar
 * de la misma.
 *
 * Si usted tiene cualquier duda o comentario sobre SemanticWebBuilder, INFOTEC pone a su disposición la siguiente
 * dirección electrónica:
 *  http://www.semanticwebbuilder.org
 */
package org.semanticwb.resource.office.sem;

import com.arthurdo.parser.HtmlStreamTokenizer;
import com.arthurdo.parser.HtmlTag;
import java.io.BufferedReader;
import java.io.ByteArrayInputStream;
import java.io.File;
import java.io.FileInputStream;
import java.io.FileNotFoundException;
import java.io.FileReader;
import java.io.IOException;
import java.io.PrintWriter;
import java.io.UnsupportedEncodingException;
import java.util.Enumeration;
import javax.servlet.http.*;
import org.semanticwb.Logger;
import org.semanticwb.SWBPortal;
import org.semanticwb.SWBUtils;
import org.semanticwb.model.Resource;
import org.semanticwb.model.User;
import org.semanticwb.model.WebPage;
import org.semanticwb.office.comunication.OfficeDocument;
import org.semanticwb.platform.SemanticObject;
import org.semanticwb.portal.api.*;
import org.semanticwb.portal.util.ContentUtils;

// TODO: Auto-generated Javadoc
/**
 * The Class WordResource.
 * 
 * @author Jorge Jiménez
 */
public class WordResource extends org.semanticwb.resource.office.sem.base.WordResourceBase
{

    /** The log. */
    private static Logger log = SWBUtils.getLogger(WordResource.class);
    /** The Constant contentUtils. */
    private static final ContentUtils contentUtils = new ContentUtils();
    /** The snpages. */
    int snpages = 15;
    /** The stxtant. */
    String stxtant = "Anterior";
    /** The stxtsig. */
    String stxtsig = "Siguiente";
    /** The stfont. */
    String stfont = "font face=\"Verdana, Arial, Helvetica, sans-serif\" size=\"2\" color=\"#000000\"";
    /** The position. */
    int position = 1;

    /**
     * Instantiates a new word resource.
     */
    public WordResource()
    {
        super();
    }

    /**
     * Instantiates a new word resource.
     * 
     * @param obj the obj
     */
    public WordResource(SemanticObject obj)
    {
        super(obj);
    }

    /**
     * Before print document.
     * 
     * @param out the out
     */
    protected void beforePrintDocument(PrintWriter out)
    {
    }

    /**
     * After print document.
     * 
     * @param out the out
     */
    protected void afterPrintDocument(PrintWriter out)
    {
    }

    /**
     * Gets the hTML.
     * 
     * @param file the file
     * @return the hTML
     */
    public static String getHTML(File file)
    {
        String name = file.getName();
        name = name.replace(".doc", ".html");
        StringBuilder html = new StringBuilder();
        try
        {
            name = java.net.URLDecoder.decode(name, "utf-8");
            file = new File(file.getParent() + "/" + name);




            FileInputStream in = new FileInputStream(file);
            byte[] buffer = new byte[2048];
            int read = in.read(buffer);
            while (read != -1)
            {
                html.append(new String(buffer, 0, read));
                read = in.read(buffer);
            }
            String workpath = file.getAbsolutePath().replace('\\', '/');
            String applicationpath = SWBUtils.getApplicationPath();
            if (workpath.toLowerCase().startsWith(applicationpath.toLowerCase()))
            {
                workpath = workpath.substring(0, applicationpath.length());
                workpath = SWBPortal.getContextPath() + workpath;
            }
            return SWBPortal.UTIL.parseHTML(html.toString(), workpath);

        }
        catch (UnsupportedEncodingException uee)
        {
            log.error(uee);
        }
        catch (FileNotFoundException uee)
        {
            log.error(uee);
        }
        catch (IOException uee)
        {
            log.error(uee);
        }
        return html.toString();

    }

    /**
     * Prints the document.
     * 
     * @param out the out
     * @param path the path
     * @param workpath the workpath
     * @param html the html
     */
    protected void printDocument(PrintWriter out, String path, String workpath, String html)
    {
        out.write(html);
    }

    /**
     * Creates the word resource.
     * 
     * @param id the id
     * @param model the model
     * @return the org.semanticwb.resource.office.sem. word resource
     */
    public static org.semanticwb.resource.office.sem.WordResource createWordResource(String id, org.semanticwb.model.SWBModel model)
    {
        return (org.semanticwb.resource.office.sem.WordResource) model.getSemanticObject().getModel().createGenericObject(model.getSemanticObject().getModel().getObjectUri(id, sclass), sclass);
    }

    /* (non-Javadoc)
     * @see org.semanticwb.resource.office.sem.OfficeResource#doView(HttpServletRequest, HttpServletResponse, SWBParamRequest)
     */
    @Override
    public void doView(HttpServletRequest request, HttpServletResponse response, SWBParamRequest paramRequest) throws SWBResourceException, IOException
    {

        Resource base = paramRequest.getResourceBase();
        WebPage page = paramRequest.getWebPage();
        try
        {

            User user = paramRequest.getUser();
            String file = null;
            if (this.getResourceBase().getAttribute(OfficeDocument.FILE_HTML) == null)
            {
                updateFileCache(user);
                file = this.getResourceBase().getAttribute(OfficeDocument.FILE_HTML);
            }
            else
            {
                file = this.getResourceBase().getAttribute(OfficeDocument.FILE_HTML);
            }
            if (file != null)
            {
                file = file.replace(".doc", ".html");
                file = java.net.URLDecoder.decode(file, "utf-8");
                String path = SWBPortal.getWorkPath();
                if (path.endsWith("/"))
                {
                    path = path.substring(0, path.length() - 1);
                    path += getResourceBase().getWorkPath() + "/" + file;
                }
                else
                {
                    path += getResourceBase().getWorkPath() + "/" + file;
                }

                File filecontent = new File(path);
                if (!filecontent.exists())
                {
                    updateFileCache(user);
                    file = this.getResourceBase().getAttribute(OfficeDocument.FILE_HTML);
                    file = file.replace(".doc", ".html");
                    file = java.net.URLDecoder.decode(file, "utf-8");
                    path = SWBPortal.getWorkPath();
                    if (path.endsWith("/"))
                    {
                        path = path.substring(0, path.length() - 1);
                        path += getResourceBase().getWorkPath() + "/" + file;
                    }
                    else
                    {
                        path += getResourceBase().getWorkPath() + "/" + file;
                    }
                    filecontent = new File(path);
                }
                if (filecontent.exists())
                {

                    boolean isutf8 = false;
                    try
                    {
                        isutf8 = SWBUtils.IO.isUTF8(filecontent);
                    }
                    catch (IOException ioe)
                    {
                        log.error(ioe);
                    }
                    String workpath = SWBPortal.getWebWorkPath() + getResourceBase().getWorkPath() + "/";
                    StringBuilder html = new StringBuilder();
                    try
                    {
                        if (isutf8)
                        {
                            FileReader reader = null;
                            try
                            {
                                reader = new FileReader(filecontent);
                                BufferedReader br = new BufferedReader(reader);
                                String line = br.readLine();
                                while (line != null)
                                {
                                    if (isutf8)
                                    {
                                        line = new String(line.getBytes(reader.getEncoding()), "utf-8");
                                    }
                                    html.append(line);
                                    html.append("\r\n");
                                    line = br.readLine();
                                }
                            }
                            catch (Exception ioe)
                            {
                                log.error(ioe);
                            } finally
                            {
                                if (reader != null)
                                {
                                    try
                                    {
                                        reader.close();
                                    }
                                    catch (IOException ioe)
                                    {
                                        log.error(ioe);
                                    }
                                }
                            }

                        }
                        else
                        {
                            FileInputStream in = null;
                            try
                            {
                                in = new FileInputStream(filecontent);
                                byte[] buffer = new byte[2048];
                                int read = in.read(buffer);
                                while (read != -1)
                                {
                                    html.append(new String(buffer, 0, read));
                                    read = in.read(buffer);
                                }
                            }
                            catch (Exception ioe)
                            {
                                log.error(ioe);
                            } finally
                            {
                                if (in != null)
                                {
                                    try
                                    {
                                        in.close();
                                    }
                                    catch (IOException ioe)
                                    {
                                        log.error(ioe);
                                    }
                                }
                            }
                        }
                        String htmlOut = null;
                        if (isPages() && getNpages() > 0)
                        {
                            htmlOut = SWBPortal.UTIL.parseHTML(html.toString(), workpath, getNpages());
                        }
                        else
                        {
                            htmlOut = SWBPortal.UTIL.parseHTML(html.toString(), workpath);
                        }
                        PrintWriter out = response.getWriter();
                        beforePrintDocument(out);

                        //Agregado por Jorge Jiménez para poner estilos predefinidos y paginación MsWord y OpenOffice (5/07/2009)
                        if (paramRequest.getLocaleString("txtant") != null)
                        {
                            stxtant = paramRequest.getLocaleString("txtant");
                        }
                        if (paramRequest.getLocaleString("txtsig") != null)
                        {
                            stxtsig = paramRequest.getLocaleString("txtsig");
                        }
                        if (getNpages() > 0)
                        {
                            snpages = getNpages();
                        }
                        if (getTxtant() != null && getTxtant().trim().length() > 0)
                        {
                            stxtant = getTxtant();
                        }
                        if (getTxtsig() != null && getTxtsig().trim().length() > 0)
                        {
                            stxtsig = getTxtsig();
                        }
                        if (getTfont() != null && getTfont().trim().length() > 0)
                        {
                            stfont = getTfont();
                        }
                        if (getPosition() > 0)
                        {
                            position = getPosition();
                        }

                        boolean iswordcontent = true;
                        int posword = htmlOut.toLowerCase().indexOf("name=\"generator\" content=\"openoffice.org"); //detección de si el contenido es de openOffice
                        if (posword > -1)
                        {
                            iswordcontent = false;
                        }

                        if (iswordcontent)
                        { //Contenido MsWord
                            htmlOut = contentUtils.predefinedStyles(htmlOut, base, isTpred()); //Estilos predefinidos
                            if (isPages())
                            {
                                htmlOut = contentUtils.paginationMsWord(request, htmlOut, page, request.getParameter("page"), base, snpages, stxtant, stxtsig, stfont, position);
                            } //Paginación
                        }
                        else if (isPages())
                        { //Contenido OpenOffice
                            htmlOut = contentUtils.paginationOpenOffice(request, htmlOut, page, request.getParameter("page"), base, snpages, stxtant, stxtsig, stfont, position); //Paginación
                        }
                        //Termina Agregado por Jorge Jiménez (5/07/2009)
                        // eliminar , etc

                        boolean deletestyles = false;
                        try
                        {
                            deletestyles = this.isDeletestyles();
                        }
                        catch (Exception e)
                        {
                            log.error(e);
                        }
                        htmlOut = cleanHTML(htmlOut, deletestyles);
                        printDocument(out, path, workpath, htmlOut);
                        afterPrintDocument(out);
                        out.close();
                    }
                    catch (Exception e)
                    {
                        log.error(e);
                    }

                }
                else
                {
                    log.error("Contenido no encontrado en ruta: " + filecontent.getAbsolutePath() + ": " + getContent() + "@" + getRepositoryName());
                }
            }
        }
        catch (Exception e)
        {
            log.error(e);
        }
    }

    /**
     * Clean html.
     * 
     * @param datos the datos
     * @param deletesytyles the deletesytyles
     * @return the string
     */
    public static String cleanHTML(String datos, boolean deletesytyles)
    {
        HtmlStreamTokenizer tok = new HtmlStreamTokenizer(new ByteArrayInputStream(datos.getBytes()));
        StringBuilder ret = new StringBuilder();
        HtmlTag tag = new HtmlTag();
        boolean omit = false;
        try
        {
            while (tok.nextToken() != HtmlStreamTokenizer.TT_EOF)
            {
                int ttype = tok.getTokenType();
                if (ttype == HtmlStreamTokenizer.TT_TAG || ttype == HtmlStreamTokenizer.TT_COMMENT)
                {
                    if (ttype == HtmlStreamTokenizer.TT_COMMENT && tok.getRawString().equals(""))
                    {
                        continue;
                    }
                    tok.parseTag(tok.getStringValue(), tag);

                    if (tok.getRawString().toLowerCase().startsWith("