All Downloads are FREE. Search and download functionalities are using the official Maven repository.

org.lumongo.server.rest.TermsResource Maven / Gradle / Ivy

The newest version!
package org.lumongo.server.rest;

import com.cedarsoftware.util.io.JsonWriter;
import com.google.protobuf.InvalidProtocolBufferException;
import com.google.protobuf.util.JsonFormat;
import com.mongodb.util.JSONSerializers;
import org.bson.Document;
import org.lumongo.LumongoConstants;
import org.lumongo.cluster.message.Lumongo;
import org.lumongo.server.index.LumongoIndexManager;

import javax.ws.rs.DefaultValue;
import javax.ws.rs.GET;
import javax.ws.rs.Path;
import javax.ws.rs.Produces;
import javax.ws.rs.QueryParam;
import javax.ws.rs.core.Context;
import javax.ws.rs.core.MediaType;
import javax.ws.rs.core.Response;
import java.util.ArrayList;
import java.util.List;

@Path(LumongoConstants.TERMS_URL)
public class TermsResource {

	private LumongoIndexManager indexManager;

	public TermsResource(LumongoIndexManager indexManager) {
		this.indexManager = indexManager;
	}

	@GET
	@Produces({ MediaType.APPLICATION_JSON + ";charset=utf-8", MediaType.TEXT_PLAIN + ";charset=utf-8" })
	public Response get(@Context Response response, @QueryParam(LumongoConstants.INDEX) final String indexName,
			@QueryParam(LumongoConstants.FIELDS) final String field, @QueryParam(LumongoConstants.AMOUNT) final Integer amount,
			@QueryParam(LumongoConstants.MIN_DOC_FREQ) final Integer minDocFreq, @QueryParam(LumongoConstants.MIN_TERM_FREQ) final Integer minTermFreq,
			@QueryParam(LumongoConstants.START_TERM) final String startTerm, @QueryParam(LumongoConstants.END_TERM) final String endTerm,
			@QueryParam(LumongoConstants.TERM_FILTER) final String termFilter, @QueryParam(LumongoConstants.TERM_MATCH) final String termMatch,
			@QueryParam(LumongoConstants.INCLUDE_TERM) final List includeTerm, @QueryParam(LumongoConstants.FUZZY_TERM_JSON) final String fuzzyTermJson,
			@QueryParam(LumongoConstants.PRETTY) boolean pretty, @QueryParam(LumongoConstants.FORMAT) @DefaultValue("json") final String format) {

		if (indexName != null && field != null) {

			Lumongo.GetTermsRequest.Builder termsBuilder = Lumongo.GetTermsRequest.newBuilder();
			termsBuilder.setIndexName(indexName);
			termsBuilder.setFieldName(field);
			if (amount != null) {
				termsBuilder.setAmount(amount);
			}

			if (minDocFreq != null) {
				termsBuilder.setMinDocFreq(minDocFreq);
			}
			if (minTermFreq != null) {
				termsBuilder.setMinTermFreq(minTermFreq);
			}

			if (startTerm != null) {
				termsBuilder.setStartTerm(startTerm);
			}
			if (endTerm != null) {
				termsBuilder.setEndTerm(endTerm);
			}

			if (termFilter != null) {
				termsBuilder.setTermFilter(termFilter);
			}
			if (termMatch != null) {
				termsBuilder.setTermMatch(termMatch);
			}

			if (includeTerm != null) {
				termsBuilder.addAllIncludeTerm(includeTerm);
			}

			if (fuzzyTermJson != null) {
				try {
					Lumongo.FuzzyTerm.Builder fuzzyTermBuilder = Lumongo.FuzzyTerm.newBuilder();
					JsonFormat.parser().merge(fuzzyTermJson, fuzzyTermBuilder);
					termsBuilder.setFuzzyTerm(fuzzyTermBuilder);
				}

				catch (InvalidProtocolBufferException e) {
					return Response.status(LumongoConstants.INTERNAL_ERROR)
							.entity("Failed to parse analyzer json: " + e.getClass().getSimpleName() + ":" + e.getMessage()).build();
				}

			}

			try {
				Lumongo.GetTermsResponse terms = indexManager.getTerms(termsBuilder.build());

				if (format.equalsIgnoreCase("json")) {
					Document document = new Document();
					document.put("index", indexName);
					document.put("field", field);

					List termsDocs = new ArrayList<>();
					for (Lumongo.Term term : terms.getTermList()) {
						Document termDoc = new Document();
						termDoc.put("term", term.getValue());
						termDoc.put("docFreq", term.getDocFreq());
						termDoc.put("termFreq", term.getTermFreq());
						if (term.hasScore()) {
							termDoc.put("score", term.getScore());
						}
						termsDocs.add(termDoc);
					}

					document.put("terms", termsDocs);
					String docString = JSONSerializers.getStrict().serialize(document);

					if (pretty) {
						docString = JsonWriter.formatJson(docString);
					}

					return Response.status(LumongoConstants.SUCCESS).type(MediaType.APPLICATION_JSON_TYPE + ";charset=utf-8").entity(docString).build();
				}
				else {

					StringBuilder csvString = new StringBuilder();

					csvString.append("term");
					csvString.append(",");
					csvString.append("termFreq");
					csvString.append(",");
					csvString.append("docFreq");
					if (termsBuilder.hasFuzzyTerm()) {
						csvString.append(",");
						csvString.append("score");
					}
					csvString.append("\n");

					for (Lumongo.Term term : terms.getTermList()) {
						String value = term.getValue();
						if (value.contains(",") || value.contains(" ") || value.contains("\"") || value.contains("\n")) {
							csvString.append("\"");
							csvString.append(value.replace("\"", "\"\""));
							csvString.append("\"");
						}
						else {
							csvString.append(value);
						}
						csvString.append(",");
						csvString.append(term.getTermFreq());
						csvString.append(",");
						csvString.append(term.getDocFreq());
						if (term.hasScore()) {
							csvString.append(",");
							csvString.append(term.getScore());
						}
						csvString.append("\n");
					}
					return Response.status(LumongoConstants.SUCCESS).type(MediaType.TEXT_PLAIN + ";charset=utf-8").entity(csvString.toString()).build();
				}

			}
			catch (Exception e) {
				return Response.status(LumongoConstants.INTERNAL_ERROR).entity("Failed to fetch fields for index <" + indexName + ">: " + e.getMessage())
						.build();
			}
		}
		else {
			return Response.status(LumongoConstants.INTERNAL_ERROR).entity("No index or field defined").build();
		}

	}

}




© 2015 - 2024 Weber Informatics LLC | Privacy Policy