toolkit.analyzer.3.0.0.source-code.PackageManager.kt Maven / Gradle / Ivy
Go to download
Show more of this group Show more artifacts with this name
Show all versions of analyzer Show documentation
Show all versions of analyzer Show documentation
Part of the OSS Review Toolkit (ORT), a suite to automate software compliance checks.
/*
* Copyright (C) 2017 The ORT Project Authors (see )
*
* Licensed under the Apache License, Version 2.0 (the "License");
* you may not use this file except in compliance with the License.
* You may obtain a copy of the License at
*
* https://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing, software
* distributed under the License is distributed on an "AS IS" BASIS,
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
* See the License for the specific language governing permissions and
* limitations under the License.
*
* SPDX-License-Identifier: Apache-2.0
* License-Filename: LICENSE
*/
package org.ossreviewtoolkit.analyzer
import java.io.File
import java.nio.file.FileSystems
import java.nio.file.FileVisitResult
import java.nio.file.Files
import java.nio.file.Path
import java.nio.file.SimpleFileVisitor
import java.nio.file.attribute.BasicFileAttributes
import kotlin.io.path.invariantSeparatorsPathString
import kotlin.time.measureTime
import org.apache.logging.log4j.kotlin.Logging
import org.apache.maven.project.ProjectBuildingException
import org.ossreviewtoolkit.downloader.VcsHost
import org.ossreviewtoolkit.downloader.VersionControlSystem
import org.ossreviewtoolkit.model.DependencyGraph
import org.ossreviewtoolkit.model.Identifier
import org.ossreviewtoolkit.model.Project
import org.ossreviewtoolkit.model.ProjectAnalyzerResult
import org.ossreviewtoolkit.model.VcsInfo
import org.ossreviewtoolkit.model.VcsType
import org.ossreviewtoolkit.model.config.AnalyzerConfiguration
import org.ossreviewtoolkit.model.config.Excludes
import org.ossreviewtoolkit.model.config.PackageManagerConfiguration
import org.ossreviewtoolkit.model.config.RepositoryConfiguration
import org.ossreviewtoolkit.model.createAndLogIssue
import org.ossreviewtoolkit.utils.common.Options
import org.ossreviewtoolkit.utils.common.Plugin
import org.ossreviewtoolkit.utils.common.VCS_DIRECTORIES
import org.ossreviewtoolkit.utils.common.collectMessages
import org.ossreviewtoolkit.utils.common.isSymbolicLink
import org.ossreviewtoolkit.utils.ort.ORT_CONFIG_FILENAME
import org.ossreviewtoolkit.utils.ort.normalizeVcsUrl
import org.ossreviewtoolkit.utils.ort.showStackTrace
typealias ManagedProjectFiles = Map>
typealias ProjectResults = Map>
/**
* A class representing a package manager that handles software dependencies. The package manager is referred to by its
* [managerName]. The analysis of any projects and their dependencies starts in the [analysisRoot] directory using the
* given general [analyzerConfig]. Per-repository configuration is passed in [repoConfig].
*/
abstract class PackageManager(
val managerName: String,
val analysisRoot: File,
val analyzerConfig: AnalyzerConfiguration,
val repoConfig: RepositoryConfiguration
) {
companion object : Logging {
/**
* All [package manager factories][PackageManagerFactory] available in the classpath, associated by their names.
*/
val ALL by lazy { Plugin.getAll() }
/**
* The available [package manager factories][PackageManagerFactory] that are enabled by default.
*/
val ENABLED_BY_DEFAULT by lazy { ALL.values.filter { it.isEnabledByDefault } }
private val PACKAGE_MANAGER_DIRECTORIES = setOf(
// Ignore intermediate build system directories.
".gradle",
".yarn",
"node_modules",
// Ignore resources in a standard Maven / Gradle project layout.
"META-INF/maven",
"src/main/resources",
"src/test/resources",
// Ignore virtual environments in Python.
"lib/python2.*/dist-packages",
"lib/python3.*/site-packages"
)
private val IGNORED_DIRECTORY_MATCHERS = (VCS_DIRECTORIES + PACKAGE_MANAGER_DIRECTORIES).map {
FileSystems.getDefault().getPathMatcher("glob:**/$it")
}
/**
* Recursively search the [directory] for files managed by any of the [packageManagers]. The search is performed
* depth-first so that root project files are found before any subproject files for a specific manager. Path
* excludes defined by the given [excludes] are taken into account; the corresponding directories are skipped.
*/
fun findManagedFiles(
directory: File,
packageManagers: Collection = ENABLED_BY_DEFAULT,
excludes: Excludes = Excludes.EMPTY
): ManagedProjectFiles {
require(directory.isDirectory) {
"The provided path is not a directory: ${directory.absolutePath}"
}
logger.debug { "Searching for managed files using the following excludes: $excludes" }
val result = mutableMapOf>()
val rootPath = directory.toPath()
Files.walkFileTree(
rootPath,
object : SimpleFileVisitor() {
override fun preVisitDirectory(dir: Path, attributes: BasicFileAttributes): FileVisitResult {
if (IGNORED_DIRECTORY_MATCHERS.any { it.matches(dir) }) {
logger.info {
"Not analyzing directory '$dir' as it is hard-coded to be ignored."
}
return FileVisitResult.SKIP_SUBTREE
}
if (excludes.isPathExcluded(rootPath, dir)) {
logger.info {
"Not analyzing directory '$dir' as it is excluded."
}
return FileVisitResult.SKIP_SUBTREE
}
val dirAsFile = dir.toFile()
// Note that although FileVisitOption.FOLLOW_LINKS is not set, this would still follow junctions
// on Windows, so do a better check here.
if (dirAsFile.isSymbolicLink()) {
logger.info { "Not following symbolic link to directory '$dir'." }
return FileVisitResult.SKIP_SUBTREE
}
val filesInDir = dirAsFile.walk().maxDepth(1).filter {
it.isFile && !excludes.isPathExcluded(rootPath, it.toPath())
}.toList()
packageManagers.distinct().forEach { manager ->
// Create a list of lists of matching files per glob.
val matchesPerGlob = manager.matchersForDefinitionFiles.mapNotNull { glob ->
// Create a list of files in the current directory that match the current glob.
val filesMatchingGlob = filesInDir.filter { glob.matches(it.toPath()) }
filesMatchingGlob.takeIf { it.isNotEmpty() }
}
if (matchesPerGlob.isNotEmpty()) {
// Only consider all matches for the first glob that has matches. This is because globs
// are defined in order of priority, and multiple globs may just be alternative ways to
// detect the exact same project.
// That is, at the example of a PIP project, if a directory contains all three files
// "requirements-py2.txt", "requirements-py3.txt" and "setup.py", only consider the
// former two as they match the glob with the highest priority, but ignore "setup.py".
result.getOrPut(manager) { mutableListOf() } += matchesPerGlob.first()
}
}
return FileVisitResult.CONTINUE
}
}
)
return result
}
/**
* Enrich a [package's VCS information][vcsFromPackage] with information deduced from the package's VCS URL or a
* [list of fallback URLs][fallbackUrls] (the first element that is recognized as a VCS URL is used).
*/
fun processPackageVcs(vcsFromPackage: VcsInfo, vararg fallbackUrls: String): VcsInfo {
val normalizedVcsFromPackage = vcsFromPackage.normalize()
val fallbackVcs = fallbackUrls.mapTo(mutableListOf(VcsHost.parseUrl(normalizedVcsFromPackage.url))) {
VcsHost.parseUrl(normalizeVcsUrl(it))
}.find {
// Ignore fallback VCS information that changes a known type, or where the VCS type is unknown.
if (normalizedVcsFromPackage.type != VcsType.UNKNOWN) {
it.type == normalizedVcsFromPackage.type
} else {
it.type != VcsType.UNKNOWN
}
}
if (fallbackVcs != null) {
// Enrich (not overwrite) the normalized VCS information from the package...
val mergedVcs = normalizedVcsFromPackage.merge(fallbackVcs)
if (mergedVcs != normalizedVcsFromPackage) {
// ... but if indeed metadata was enriched, overwrite the URL with the one from the fallback VCS
// information to ensure we get the correct base URL if additional VCS information (like a revision
// or path) has been split from the original URL.
return mergedVcs.copy(url = fallbackVcs.url)
}
}
return normalizedVcsFromPackage
}
/**
* Enrich VCS information determined from the [project's directory][projectDir] with VCS information determined
* from the [project's metadata][vcsFromProject], if any, and from a [list of fallback URLs][fallbackUrls] (the
* first element that is recognized as a VCS URL is used).
*/
fun processProjectVcs(
projectDir: File,
vcsFromProject: VcsInfo = VcsInfo.EMPTY,
vararg fallbackUrls: String
): VcsInfo {
val vcsFromWorkingTree = VersionControlSystem.getPathInfo(projectDir).normalize()
return vcsFromWorkingTree.merge(processPackageVcs(vcsFromProject, *fallbackUrls))
}
/**
* Return an [Excludes] instance to be applied during analysis based on the given [repositoryConfiguration].
* If this [AnalyzerConfiguration] has the [AnalyzerConfiguration.skipExcluded] flag set to true, the
* excludes configured in [repositoryConfiguration] are actually applied. Otherwise, return an empty [Excludes]
* object. This means that all dependencies are collected, and excludes are applied later on the report level.
*/
internal fun AnalyzerConfiguration.excludes(repositoryConfiguration: RepositoryConfiguration): Excludes =
repositoryConfiguration.excludes.takeIf { skipExcluded } ?: Excludes.EMPTY
/**
* Check whether the given [path] interpreted relatively against [root] is matched by a path exclude in this
* [Excludes] object.
*/
private fun Excludes.isPathExcluded(root: Path, path: Path): Boolean =
isPathExcluded(root.relativize(path).invariantSeparatorsPathString)
/**
* Get a fallback project name from the [definitionFile] path relative to the [analysisRoot]. This function
* should be used if the project name cannot be determined from the project's metadata.
*/
fun getFallbackProjectName(analysisRoot: File, definitionFile: File) =
definitionFile.relativeTo(analysisRoot).invariantSeparatorsPath
}
/**
* The [Options] from the [PackageManagerConfiguration] for this [package manager][managerName].
*/
protected val options: Options = analyzerConfig.getPackageManagerConfiguration(managerName)?.options.orEmpty()
/**
* The [Excludes] to take into account during analysis. The [Excludes] from the [RepositoryConfiguration] are
* taken into account only if this is enabled in the [AnalyzerConfiguration].
*/
val excludes by lazy { analyzerConfig.excludes(repoConfig) }
/**
* Optional mapping of found [definitionFiles] before dependency resolution.
*/
open fun mapDefinitionFiles(definitionFiles: List): List = definitionFiles
/**
* Return if this package manager must run before or after certain other package managers. This can manually be
* configured by the user in [PackageManagerConfiguration.mustRunAfter], but in some cases it is possible to
* determine such dependencies automatically.
*/
open fun findPackageManagerDependencies(
managedFiles: Map>
): PackageManagerDependencyResult =
PackageManagerDependencyResult(mustRunBefore = emptySet(), mustRunAfter = emptySet())
/**
* Optional step to run before dependency resolution, like checking for prerequisites.
*/
protected open fun beforeResolution(definitionFiles: List) {}
/**
* Optional step to run after dependency resolution, like cleaning up temporary files.
*/
protected open fun afterResolution(definitionFiles: List) {}
/**
* Generate the final result to be returned by this package manager. This function is called at the very end of the
* execution of this package manager (after [afterResolution]) with the [projectResults] created for the single
* definition files that have been processed. It can be overridden by subclasses to add additional data to the
* result. This base implementation produces a result that contains only the passed in map with project results.
*/
protected open fun createPackageManagerResult(projectResults: ProjectResults) = PackageManagerResult(projectResults)
/**
* Return a tree of resolved dependencies (not necessarily declared dependencies, in case conflicts were resolved)
* for all [definitionFiles] which were found by searching the [analysisRoot] directory. By convention, the
* [definitionFiles] must be absolute. The given [labels] are parameters to the overall analysis of the project and
* to further stages. They are not interpreted by ORT, but can be used to configure behavior of custom package
* manager implementations.
*/
open fun resolveDependencies(definitionFiles: List, labels: Map): PackageManagerResult {
definitionFiles.forEach { definitionFile ->
requireNotNull(definitionFile.relativeToOrNull(analysisRoot)) {
"'$definitionFile' must be an absolute path below '$analysisRoot'."
}
}
val result = mutableMapOf>()
beforeResolution(definitionFiles)
definitionFiles.forEach { definitionFile ->
val relativePath = definitionFile.relativeTo(analysisRoot).invariantSeparatorsPath.ifEmpty { "." }
logger.info { "Using $managerName to resolve dependencies for path '$relativePath'..." }
val duration = measureTime {
runCatching {
result[definitionFile] = resolveDependencies(definitionFile, labels)
}.onFailure {
it.showStackTrace()
// In case of Maven we might be able to do better than inferring the name from the path.
val id = if (it is ProjectBuildingException && it.projectId?.isEmpty() == false) {
Identifier("Maven:${it.projectId}")
} else {
Identifier.EMPTY.copy(type = managerName, name = relativePath)
}
val projectWithIssues = Project.EMPTY.copy(
id = id,
definitionFilePath = VersionControlSystem.getPathInfo(definitionFile).path,
vcsProcessed = processProjectVcs(definitionFile.parentFile),
scopeDependencies = null,
scopeNames = emptySet()
)
val issues = listOf(
createAndLogIssue(
source = managerName,
message = "$managerName failed to resolve dependencies for path '$relativePath': " +
it.collectMessages()
)
)
result[definitionFile] = listOf(ProjectAnalyzerResult(projectWithIssues, emptySet(), issues))
}
}
logger.info { "$managerName resolved dependencies for path '$relativePath' in $duration." }
}
afterResolution(definitionFiles)
return createPackageManagerResult(result).addDependencyGraphIfMissing()
}
/**
* Resolve dependencies for a single absolute [definitionFile] and return a list of [ProjectAnalyzerResult]s, with
* one result for each project found in the definition file. The given [labels] are parameters to the overall
* analysis of the project and to further stages. They are not interpreted by ORT, but can be used to configure
* behavior of custom package manager implementations.
*/
abstract fun resolveDependencies(definitionFile: File, labels: Map): List
protected fun requireLockfile(workingDir: File, condition: () -> Boolean) {
require(analyzerConfig.allowDynamicVersions || condition()) {
val relativePathString = workingDir.relativeTo(analysisRoot).invariantSeparatorsPath
.takeUnless { it.isEmpty() } ?: "."
"No lockfile found in '$relativePathString'. This potentially results in unstable versions of " +
"dependencies. To support this, enable the 'allowDynamicVersions' option in '$ORT_CONFIG_FILENAME'."
}
}
/**
* Remove all packages from the contained [ProjectAnalyzerResult]s which are also projects.
*/
protected fun ProjectResults.filterProjectPackages(): ProjectResults {
val projectIds = flatMapTo(mutableSetOf()) { (_, projectResult) -> projectResult.map { it.project.id } }
return mapValues { entry ->
entry.value.map { projectResult ->
val projectReferences = projectResult.packages.filterTo(mutableSetOf()) { it.id in projectIds }
projectResult.takeIf { projectReferences.isEmpty() }
?: projectResult.copy(packages = projectResult.packages - projectReferences)
.also {
logger.info { "Removing ${projectReferences.size} packages that are projects." }
logger.debug { projectReferences.joinToString { it.id.toCoordinates() } }
}
}
}
}
}
/**
* Parse a string with metadata about an [author] to extract the author name. Many package managers support
* such author information in string form that contain additional properties like an email address or a
* homepage. These additional properties are typically separated from the author name by specific [delimiters],
* e.g. the email address is often surrounded by angle brackets. This function assumes that the author name is the
* first portion in the given [author] string before one of the given [delimiters] is found.
*/
fun parseAuthorString(author: String?, vararg delimiters: Char = charArrayOf('<')): String? =
author?.split(*delimiters, limit = 2)?.firstOrNull()?.trim()?.ifEmpty { null }
private fun PackageManagerResult.addDependencyGraphIfMissing(): PackageManagerResult {
// If the condition is true, then [CompatibilityDependencyNavigator] constructs a [DependencyGraphNavigator].
// That construction throws an exception if there is no dependency graph available.
val isGraphRequired = projectResults.values.flatten().any { it.project.scopeNames != null }
return if (isGraphRequired && dependencyGraph == null) {
copy(dependencyGraph = DependencyGraph())
} else {
this
}
}
© 2015 - 2025 Weber Informatics LLC | Privacy Policy