
org.apache.kylin.streaming.jobs.StreamingSegmentManager

/*
 * Licensed to the Apache Software Foundation (ASF) under one
 * or more contributor license agreements.  See the NOTICE file
 * distributed with this work for additional information
 * regarding copyright ownership.  The ASF licenses this file
 * to you under the Apache License, Version 2.0 (the
 * "License"); you may not use this file except in compliance
 * with the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */

package org.apache.kylin.streaming.jobs;

import org.apache.commons.lang3.StringUtils;
import org.apache.kylin.common.KylinConfig;
import org.apache.kylin.common.response.RestResponse;
import org.apache.kylin.common.util.RandomUtil;
import org.apache.kylin.job.execution.JobTypeEnum;
import org.apache.kylin.metadata.model.SegmentRange;
import org.apache.kylin.metadata.cube.model.LayoutEntity;
import org.apache.kylin.metadata.cube.model.NDataLayout;
import org.apache.kylin.metadata.cube.model.NDataSegment;
import org.apache.kylin.metadata.cube.model.NDataflowManager;
import org.apache.kylin.metadata.cube.utils.StreamingUtils;
import org.apache.kylin.metadata.project.EnhancedUnitOfWork;
import org.apache.kylin.streaming.request.StreamingSegmentRequest;
import org.apache.kylin.streaming.rest.RestSupport;
import org.apache.kylin.streaming.util.JobExecutionIdHolder;
import org.apache.spark.sql.SparkSession;
import org.apache.spark.sql.kafka010.OffsetRangeManager;

import lombok.val;
import lombok.extern.slf4j.Slf4j;

/**
 * Allocates streaming segments for a dataflow: in unit-test environments the
 * segment is appended directly through {@link NDataflowManager}; otherwise it
 * is created through a REST call to the Kylin server.
 */
@Slf4j
public class StreamingSegmentManager {

    private static final String SEGMENT_POST_URL = "/streaming_jobs/dataflow/segment";

    /** Convenience overload: the Kafka offset range is taken from the current Spark streaming batch. */
    public static NDataSegment allocateSegment(SparkSession ss, String dataflowId, String project, Long batchMinTime,
            Long batchMaxTime) {
        return allocateSegment(ss, null, dataflowId, project, batchMinTime, batchMaxTime);
    }

    public static NDataSegment allocateSegment(SparkSession ss, SegmentRange.KafkaOffsetPartitionedSegmentRange sr,
            String dataflowId, String project, Long batchMinTime, Long batchMaxTime) {
        if (sr == null) {
            // No explicit range supplied: derive it from the offsets of the current Spark batch.
            val offsetRange = OffsetRangeManager.currentOffsetRange(ss);
            sr = new SegmentRange.KafkaOffsetPartitionedSegmentRange(batchMinTime, batchMaxTime,
                    OffsetRangeManager.partitionOffsets(offsetRange._1),
                    OffsetRangeManager.partitionOffsets(offsetRange._2));
        }
        NDataSegment newSegment;
        KylinConfig config = KylinConfig.getInstanceFromEnv();
        if (config.isUTEnv()) {
            // Unit-test environment: append the segment directly inside a metadata transaction.
            val segRange = sr;
            newSegment = EnhancedUnitOfWork.doInTransactionWithCheckAndRetry(() -> {
                NDataflowManager dfMgr = NDataflowManager.getInstance(KylinConfig.getInstanceFromEnv(), project);
                return dfMgr.appendSegmentForStreaming(dfMgr.getDataflow(dataflowId), segRange);
            }, project);
            return newSegment;
        } else {
            // Production path: create the segment through the REST endpoint, then replay the
            // audit log before reading the new segment back from local metadata.
            StreamingSegmentRequest req = new StreamingSegmentRequest(project, dataflowId);
            req.setSegmentRange(sr);
            req.setNewSegId(RandomUtil.randomUUIDStr());
            req.setJobType(JobTypeEnum.STREAMING_BUILD.name());
            val jobId = StreamingUtils.getJobId(dataflowId, req.getJobType());
            req.setJobExecutionId(JobExecutionIdHolder.getJobExecutionId(jobId));
            try (RestSupport rest = new RestSupport(config)) {
                RestResponse restResponse = rest.execute(rest.createHttpPost(SEGMENT_POST_URL), req);
                String newSegId = restResponse.getData();
                StreamingUtils.replayAuditlog();
                if (!StringUtils.isEmpty(newSegId)) {
                    NDataflowManager dfMgr = NDataflowManager.getInstance(config, project);
                    newSegment = dfMgr.getDataflow(dataflowId).getSegment(newSegId);
                    // Register a new NDataLayout for every layout in the segment's index plan.
                    for (LayoutEntity layout : newSegment.getIndexPlan().getAllLayouts()) {
                        NDataLayout ly = NDataLayout.newDataLayout(newSegment.getDataflow(), newSegment.getId(),
                                layout.getId());
                        newSegment.getLayoutsMap().put(ly.getLayoutId(), ly);
                    }
                    return newSegment;
                } else {
                    // No segment id returned: hand back an empty placeholder segment.
                    val empSeg = NDataSegment.empty();
                    empSeg.setId(StringUtils.EMPTY);
                    return empSeg;
                }
            }
        }
    }

}
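
A minimal usage sketch, not part of the Kylin source above: it assumes Kylin's streaming module and Spark are on the classpath, and the dataflow id, project name, and batch window below are placeholder values chosen for illustration. In a real streaming build job the SparkSession already carries the current Kafka batch offsets that allocateSegment reads.

import org.apache.kylin.metadata.cube.model.NDataSegment;
import org.apache.kylin.streaming.jobs.StreamingSegmentManager;
import org.apache.spark.sql.SparkSession;

public class AllocateSegmentExample {
    public static void main(String[] args) {
        // Placeholder session; a real streaming build job would already have one
        // with an active Kafka source providing the current offset range.
        SparkSession ss = SparkSession.builder()
                .appName("streaming-segment-example")
                .master("local[*]")
                .getOrCreate();
        // Without an explicit KafkaOffsetPartitionedSegmentRange, allocateSegment
        // resolves the offset range from the current Spark streaming batch.
        NDataSegment segment = StreamingSegmentManager.allocateSegment(
                ss, "placeholder-dataflow-uuid", "placeholder_project",
                1700000000000L, 1700000600000L);
        // An empty id means no segment was created for this batch.
        if (segment != null && !segment.getId().isEmpty()) {
            System.out.println("Allocated streaming segment " + segment.getId());
        }
        ss.stop();
    }
}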
