// com.metaeffekt.artifact.terms.model.FileSegment (Maven / Gradle / Ivy)
// The newest version!
/*
* Copyright 2021-2024 the original author or authors.
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*/
package com.metaeffekt.artifact.terms.model;
import com.metaeffekt.artifact.analysis.utils.StringStats;
import lombok.Getter;
import lombok.Setter;
import org.json.JSONArray;
/**
 * Holds several representations of one file segment, each kept for a different purpose:
 * the marked text as received, a normalized marker-free form, and a readable form
 * produced on demand by {@link #getContent()}.
 */
public class FileSegment {

    /** Segment text exactly as passed to the constructor, markers included. */
    @Getter
    private final String markedContent;

    /** Normalized form of the marker-free segment text, after the normalization masks were applied. */
    @Getter
    private final StringStats normalizedContent;

    /** Not assigned by the constructor; stays {@code null} until supplied through the setter. */
    @Setter
    @Getter
    private ScanResultPart normalizedSRP;

    /** Not assigned by the constructor; stays {@code null} until supplied through the setter. */
    @Getter
    @Setter
    private JSONArray licenseVariables;

    /** Preprocessor used for marker removal, both at construction time and in {@link #getContent()}. */
    private final MatchPreprocessor matchPreprocessor;

    /**
     * Builds the segment representations from the marked segment text.
     *
     * @param markedSegmentContent the segment text including markers; stored unchanged.
     * @param matchPreprocessor the preprocessor used to strip markers and to obtain the
     *                          normalization metadata whose masks are applied.
     */
    public FileSegment(String markedSegmentContent, MatchPreprocessor matchPreprocessor) {
        // keep the raw marked text and the preprocessor for later use
        this.markedContent = markedSegmentContent;
        this.matchPreprocessor = matchPreprocessor;

        // strip the markers, then build the initial normalized representation
        final StringStats maskedStats =
                StringStats.normalize(matchPreprocessor.removeMarkers(markedSegmentContent), false);

        // FIXME: AE-690 move masks before segmentation
        // apply the normalized masks (return value unused; presumably modifies maskedStats in place)
        matchPreprocessor.getNormalizationMetaData().applyMasks(maskedStats);

        this.normalizedContent = maskedStats;
    }

    /**
     * Returns the marked content with markers removed for readability and
     * leading/trailing whitespace trimmed.
     *
     * @return the trimmed, readable segment text.
     */
    public String getContent() {
        final String readable = matchPreprocessor.removeMarkersForReadability(markedContent);
        return readable.trim();
    }
}
// © 2015 - 2025 Weber Informatics LLC | Privacy Policy