All Downloads are FREE. Search and download functionalities are using the official Maven repository.

io.zulia.server.rest.TermsResource Maven / Gradle / Ivy

package io.zulia.server.rest;

import com.cedarsoftware.util.io.JsonWriter;
import com.google.protobuf.InvalidProtocolBufferException;
import com.google.protobuf.util.JsonFormat;
import io.zulia.ZuliaConstants;
import io.zulia.server.index.ZuliaIndexManager;
import org.bson.Document;

import javax.ws.rs.DefaultValue;
import javax.ws.rs.GET;
import javax.ws.rs.Path;
import javax.ws.rs.Produces;
import javax.ws.rs.QueryParam;
import javax.ws.rs.core.Context;
import javax.ws.rs.core.MediaType;
import javax.ws.rs.core.Response;
import java.util.ArrayList;
import java.util.List;

import static io.zulia.message.ZuliaBase.FuzzyTerm;
import static io.zulia.message.ZuliaBase.Term;
import static io.zulia.message.ZuliaServiceOuterClass.GetTermsRequest;
import static io.zulia.message.ZuliaServiceOuterClass.GetTermsResponse;

/**
 * Created by Payam Meyer on 8/7/17.
 * @author pmeyer
 */
@Path(ZuliaConstants.TERMS_URL)
public class TermsResource {

	private ZuliaIndexManager indexManager;

	public TermsResource(ZuliaIndexManager indexManager) {
		this.indexManager = indexManager;
	}

	@GET
	@Produces({ MediaType.APPLICATION_JSON + ";charset=utf-8", MediaType.TEXT_PLAIN + ";charset=utf-8" })
	public Response get(@Context Response response, @QueryParam(ZuliaConstants.INDEX) final String indexName,
			@QueryParam(ZuliaConstants.FIELDS) final String field, @QueryParam(ZuliaConstants.AMOUNT) final Integer amount,
			@QueryParam(ZuliaConstants.MIN_DOC_FREQ) final Integer minDocFreq, @QueryParam(ZuliaConstants.MIN_TERM_FREQ) final Integer minTermFreq,
			@QueryParam(ZuliaConstants.START_TERM) final String startTerm, @QueryParam(ZuliaConstants.END_TERM) final String endTerm,
			@QueryParam(ZuliaConstants.TERM_FILTER) final String termFilter, @QueryParam(ZuliaConstants.TERM_MATCH) final String termMatch,
			@QueryParam(ZuliaConstants.INCLUDE_TERM) final List includeTerm, @QueryParam(ZuliaConstants.FUZZY_TERM_JSON) final String fuzzyTermJson,
			@QueryParam(ZuliaConstants.PRETTY) boolean pretty, @QueryParam(ZuliaConstants.FORMAT) @DefaultValue("json") final String format) {

		if (indexName != null && field != null) {

			GetTermsRequest.Builder termsBuilder = GetTermsRequest.newBuilder();
			termsBuilder.setIndexName(indexName);
			termsBuilder.setFieldName(field);
			if (amount != null) {
				termsBuilder.setAmount(amount);
			}

			if (minDocFreq != null) {
				termsBuilder.setMinDocFreq(minDocFreq);
			}
			if (minTermFreq != null) {
				termsBuilder.setMinTermFreq(minTermFreq);
			}

			if (startTerm != null) {
				termsBuilder.setStartTerm(startTerm);
			}
			if (endTerm != null) {
				termsBuilder.setEndTerm(endTerm);
			}

			if (termFilter != null) {
				termsBuilder.setTermFilter(termFilter);
			}
			if (termMatch != null) {
				termsBuilder.setTermMatch(termMatch);
			}

			if (includeTerm != null) {
				termsBuilder.addAllIncludeTerm(includeTerm);
			}

			if (fuzzyTermJson != null) {
				try {
					FuzzyTerm.Builder fuzzyTermBuilder = FuzzyTerm.newBuilder();
					JsonFormat.parser().merge(fuzzyTermJson, fuzzyTermBuilder);
					termsBuilder.setFuzzyTerm(fuzzyTermBuilder);
				}

				catch (InvalidProtocolBufferException e) {
					return Response.status(ZuliaConstants.INTERNAL_ERROR)
							.entity("Failed to parse analyzer json: " + e.getClass().getSimpleName() + ":" + e.getMessage()).build();
				}

			}

			try {
				GetTermsResponse terms = indexManager.getTerms(termsBuilder.build());

				if (format.equalsIgnoreCase("json")) {
					Document document = new Document();
					document.put("index", indexName);
					document.put("field", field);

					List termsDocs = new ArrayList<>();
					for (Term term : terms.getTermList()) {
						Document termDoc = new Document();
						termDoc.put("term", term.getValue());
						termDoc.put("docFreq", term.getDocFreq());
						termDoc.put("termFreq", term.getTermFreq());
						termDoc.put("score", term.getScore());
						termsDocs.add(termDoc);
					}

					document.put("terms", termsDocs);
					String docString = document.toJson();

					if (pretty) {
						docString = JsonWriter.formatJson(docString);
					}

					return Response.status(ZuliaConstants.SUCCESS).type(MediaType.APPLICATION_JSON_TYPE + ";charset=utf-8").entity(docString).build();
				}
				else {

					StringBuilder csvString = new StringBuilder();

					csvString.append("term");
					csvString.append(",");
					csvString.append("termFreq");
					csvString.append(",");
					csvString.append("docFreq");
					if (termsBuilder.hasFuzzyTerm()) {
						csvString.append(",");
						csvString.append("score");
					}
					csvString.append("\n");

					for (Term term : terms.getTermList()) {
						String value = term.getValue();
						if (value.contains(",") || value.contains(" ") || value.contains("\"") || value.contains("\n")) {
							csvString.append("\"");
							csvString.append(value.replace("\"", "\"\""));
							csvString.append("\"");
						}
						else {
							csvString.append(value);
						}
						csvString.append(",");
						csvString.append(term.getTermFreq());
						csvString.append(",");
						csvString.append(term.getDocFreq());
						csvString.append(",");
						csvString.append(term.getScore());
						csvString.append("\n");
					}
					return Response.status(ZuliaConstants.SUCCESS).type(MediaType.TEXT_PLAIN + ";charset=utf-8").entity(csvString.toString()).build();
				}

			}
			catch (Exception e) {
				return Response.status(ZuliaConstants.INTERNAL_ERROR).entity("Failed to fetch fields for index <" + indexName + ">: " + e.getMessage()).build();
			}
		}
		else {
			return Response.status(ZuliaConstants.INTERNAL_ERROR).entity("No index or field defined").build();
		}

	}

}




© 2015 - 2025 Weber Informatics LLC | Privacy Policy