All Downloads are FREE. Search and download functionalities are using the official Maven repository.

com.day.cq.polling.importer.HttpImporter Maven / Gradle / Ivy

There is a newer version: 2024.11.18751.20241128T090041Z-241100
Show newest version
/*
 * Copyright 1997-2009 Day Management AG
 * Barfuesserplatz 6, 4001 Basel, Switzerland
 * All Rights Reserved.
 *
 * This software is the confidential and proprietary information of
 * Day Management AG, ("Confidential Information"). You shall not
 * disclose such Confidential Information and shall use it only in
 * accordance with the terms of the license agreement you entered into
 * with Day.
 */
package com.day.cq.polling.importer;

import java.io.IOException;
import java.io.InputStream;

import org.apache.commons.httpclient.Credentials;
import org.apache.commons.httpclient.HttpClient;
import org.apache.commons.httpclient.HttpConnectionManager;
import org.apache.commons.httpclient.HttpException;
import org.apache.commons.httpclient.HttpMethodBase;
import org.apache.commons.httpclient.HttpStatus;
import org.apache.commons.httpclient.MultiThreadedHttpConnectionManager;
import org.apache.commons.httpclient.UsernamePasswordCredentials;
import org.apache.commons.httpclient.auth.AuthScope;
import org.apache.commons.httpclient.methods.GetMethod;
import org.apache.felix.scr.annotations.Component;
import org.apache.felix.scr.annotations.Properties;
import org.apache.felix.scr.annotations.Property;
import org.apache.felix.scr.annotations.Service;
import org.apache.sling.api.resource.Resource;
import org.osgi.service.component.ComponentContext;

/**
 * The HttpImporter is an abstract implementation of the
 * {@link Importer} service interface supporting access to data using the HTTP
 * protocol.
 * 

* Extensions of this base class must implement the * {@link #importData(String, InputStream, String, Resource)} method to actuall * import the retrieved data. *

* Instanes of this base class must be initialized before being used and * be destroyed when not used any more. If the extesion is registered as an * Declarative Services Component, this initialization and destroyal is being * taken care of. Otherwise, the extension class must explicitly call the * {@link #init()} and {@link #destroy()} methods respectively. *

* The {@link #activate(ComponentContext)} and * {@link #deactivate(ComponentContext)} methods may be overwritten by extension * classes but the base class implementation must called in this case to * ensure proper initialization and destroyal. * * @deprecated Please use {@link HCImporter} instead. */ @Component(metatype = false, componentAbstract = true) @Service(Importer.class) @Properties({ @Property(name = "service.description", value = "Abstract HTTP based Importer") }) @Deprecated public abstract class HttpImporter implements Importer { /** * The HTTP Client used by this importer instance. This field is initialized * on demand by the {@link #getHttpClient()} method and cleared by the * {@link #destroy()} method. */ private HttpClient httpClient; /** * Actually imports the data recevied from the data source into the target * Resource. *

* Implementations of this method need not (and should not) close the * data input stream. This will be taken care of the caller of * this method. * * @param scheme The scheme describing the data to import. * @param data The data to be imported. * @param characterEncoding If the data contains character data, such as * XML, this parameter (may) provide the character encoding of * the character data. The value of this parameter is extracted * from the Content-Type header of the HTTP response * and may thus be empty or null if not set by the * server. * @param target The Resource into which the data is to be * imported. * @throws IOException May be thrown if an error occurrs reading or writing * the imported data. * @throws ImportException May be thrown in any other error case. */ protected abstract void importData(String scheme, InputStream data, String characterEncoding, Resource target) throws IOException; // ---------- Importer interface /** * Imports data from the given source which is expected to be * an HTTP URL. This method uses the Apache Commons Http Client library to * request the source with a method provided by {@link #newHttpMethod(String)} the * response stream is then provided to the * {@link #importData(String, InputStream, String, Resource)} method, which * must be implemented by the extension. * * @param scheme The scheme of the data source. This parameter is handed * over to the * {@link #importData(String, InputStream, String, Resource)} * method. * @param dataSource The HTTP URL to the data to be imported. * @param target The Resource into which the data is to be * imported. * @throws ImportException If an error occurrs while accessing the source or * if this class has not beenn initialized or if an error occurs * while importing the actual data through * {@link #importData(String, InputStream, String, Resource)}. */ public void importData(String scheme, String dataSource, Resource target) { importData(scheme, dataSource, target, null, null); } /** * Imports data from the given source which is expected to be * an HTTP URL. This method uses the Apache Commons Http Client library to * request the source with a method provided by {@link #newHttpMethod(String)} the * response stream is then provided to the * {@link #importData(String, InputStream, String, Resource)} method, which * must be implemented by the extension. * * @param scheme The scheme of the data source. This parameter is handed * over to the * {@link #importData(String, InputStream, String, Resource)} * method. * @param dataSource The HTTP URL to the data to be imported. * @param target The Resource into which the data is to be * imported. * @param login The login to authenticate the request. * @param password The password to authenticate the request. * @throws ImportException If an error occurrs while accessing the source or * if this class has not beenn initialized or if an error occurs * while importing the actual data through * {@link #importData(String, InputStream, String, Resource)}. */ public void importData(String scheme, String dataSource, Resource target, String login, String password) { // the method to execute HttpMethodBase method = newHttpMethod(dataSource); InputStream ins = null; try { // if login information is present, setup the authentication on the httpclient if (login != null && login.length() > 0 && password != null && password.length() > 0) { getHttpClient().getParams().setAuthenticationPreemptive(true); Credentials defaultcreds = new UsernamePasswordCredentials(login, password); getHttpClient().getState().setCredentials(AuthScope.ANY, defaultcreds); } // execute the request and check the status int statusCode = getHttpClient().executeMethod(method); switch (statusCode) { case HttpStatus.SC_OK: // this what we expect break; case HttpStatus.SC_NOT_MODIFIED: // no change in data, so just get back out of here return; default: // this is what we don't expect throw new ImportException("Failed retreiving data" + method.getStatusLine()); } // access the raw response stream and import it ins = method.getResponseBodyAsStream(); importData(scheme, ins, method.getResponseCharSet(), target); } catch (HttpException e) { throw new ImportException("Fatal protocol violation", e); } catch (IOException e) { throw new ImportException("Fatal transport error", e); } catch (IllegalStateException ise) { throw new ImportException( "HttpImporter has not been initialized yet", ise); } catch (Exception e) { throw new ImportException( "Unexpected problem while importing data", e); } finally { // close the response input stream if (ins != null) { try { ins.close(); } catch (IOException ioe) { } } // Release the connection. method.releaseConnection(); } } /** * Returns a HttpClient instance used by the * {@link #importData(String, InputStream, String, Resource)} method to * access the data source URL. The HttpClient instance is * backed by a MultiThreadedHttpConnectionManager. *

* This method cannot be overwritten. To configure the HttpClient, the * {@link #init()} method should be called with appropriate parameters which * are used to setup the client with an instance of the * HttpClientParams class. * * @return the HttpClient instance. * @see #init() */ protected final HttpClient getHttpClient() { if (httpClient == null) { httpClient = new HttpClient( new MultiThreadedHttpConnectionManager()); } return httpClient; } /** * Returns a HttpMethodBase instance used by the * {@link #importData(String, String, Resource)} method to actually retrieve * the data to be imported from the data source URL. *

* This base class implementation returns a plain GetMethod. * Extensions may overwrite to implement more soffisticated method setup. *

* Each call to this method must return a new instance of the * HttpMethodBase implementation. The * {@link #importData(String, String, Resource)} method using this instance * takes care to release the connection of the method when being done. * * @param source The data source URL for which to prepare the method * instance. * @return The HttpMethodBase to import the data, which is in * this base class implementation a GetMethod instance. */ protected HttpMethodBase newHttpMethod(String source) { return new GetMethod(source); } /** * Initializes this base class implementation. This method must be * called before the {@link #importData(String, String, Resource)} may be * used. *

* If the class is used as a Declarative Services component, this method * need not be called explicitly, since the * {@link #activate(ComponentContext)} method will call it. *

* This method may be called multiple times. After a first initialization * further successive calls without {@link #destroy() destroyal} will have * no effect. */ protected final void init() { // nothing at the moment, might set configuration } /** * Destroys this base class implementation. This method must be * called when the instance is not used any more. *

* If the class is used as a Declarative Services component, this method * need not be called explicitly, since the * {@link #deactivate(ComponentContext)} method will call it. *

* This method may be called multiple times. After a first destroyal further * successive calls without {@link #init() initialization} will have no * effect. */ protected final void destroy() { if (httpClient != null) { HttpConnectionManager cm = httpClient.getHttpConnectionManager(); if (cm instanceof MultiThreadedHttpConnectionManager) { ((MultiThreadedHttpConnectionManager) cm).shutdown(); } httpClient = null; } } // ---------- SCR integration /** * This base class implementation currently just calls the {@link #init()} * method. Nevertheless it must be called if overwritten! * * @param context Component context */ protected void activate(ComponentContext context) { init(); } /** * This base class implementation currently just calls the * {@link #destroy()} method. Nevertheless it must be called if * overwritten! * * @param context Component context */ protected void deactivate(ComponentContext context) { destroy(); } }





© 2015 - 2025 Weber Informatics LLC | Privacy Policy