Skip to content

Commit 8e2a313

Browse files
committed
feat(PackageManager): Support path excludes in findManagedFiles()
This allows skipping projects in specific paths already before starting the analysis. That way problematic / large projects that are irrelevant compliance-wise can be excluded leading to reduced resource usage and analysis time. Signed-off-by: Oliver Heger <[email protected]>
1 parent 5571239 commit 8e2a313

File tree

2 files changed

+67
-18
lines changed

2 files changed

+67
-18
lines changed

analyzer/src/main/kotlin/PackageManager.kt

+17-3
Original file line numberDiff line numberDiff line change
@@ -27,6 +27,7 @@ import java.nio.file.Path
2727
import java.nio.file.SimpleFileVisitor
2828
import java.nio.file.attribute.BasicFileAttributes
2929

30+
import kotlin.io.path.pathString
3031
import kotlin.time.measureTime
3132

3233
import org.apache.logging.log4j.kotlin.Logging
@@ -99,20 +100,25 @@ abstract class PackageManager(
99100

100101
/**
101102
* Recursively search the [directory] for files managed by any of the [packageManagers]. The search is performed
102-
* depth-first so that root project files are found before any subproject files for a specific manager.
103+
* depth-first so that root project files are found before any subproject files for a specific manager. Path
104+
* excludes defined by the given [excludes] are taken into account; the corresponding directories are skipped.
103105
*/
104106
fun findManagedFiles(
105107
directory: File,
106-
packageManagers: Collection<PackageManagerFactory> = ALL.values
108+
packageManagers: Collection<PackageManagerFactory> = ALL.values,
109+
excludes: Excludes = EMPTY_EXCLUDES
107110
): ManagedProjectFiles {
108111
require(directory.isDirectory) {
109112
"The provided path is not a directory: ${directory.absolutePath}"
110113
}
111114

115+
logger.debug { "Searching for managed files using the following excludes: $excludes" }
116+
112117
val result = mutableMapOf<PackageManagerFactory, MutableList<File>>()
118+
val rootPath = directory.toPath()
113119

114120
Files.walkFileTree(
115-
directory.toPath(),
121+
rootPath,
116122
object : SimpleFileVisitor<Path>() {
117123
override fun preVisitDirectory(dir: Path, attributes: BasicFileAttributes): FileVisitResult {
118124
if (IGNORED_DIRECTORY_MATCHERS.any { it.matches(dir) }) {
@@ -123,6 +129,14 @@ abstract class PackageManager(
123129
return FileVisitResult.SKIP_SUBTREE
124130
}
125131

132+
if (excludes.isPathExcluded(rootPath.relativize(dir).pathString)) {
133+
logger.info {
134+
"Not analyzing directory '$dir' as it is matched by a path exclude."
135+
}
136+
137+
return FileVisitResult.SKIP_SUBTREE
138+
}
139+
126140
val dirAsFile = dir.toFile()
127141

128142
// Note that although FileVisitOption.FOLLOW_LINKS is not set, this would still follow junctions

analyzer/src/test/kotlin/PackageManagerTest.kt

+50-15
Original file line numberDiff line numberDiff line change
@@ -29,10 +29,16 @@ import io.kotest.matchers.maps.beEmpty
2929
import io.kotest.matchers.should
3030
import io.kotest.matchers.shouldBe
3131

32+
import java.io.File
33+
3234
import org.ossreviewtoolkit.analyzer.managers.*
3335
import org.ossreviewtoolkit.model.VcsInfo
3436
import org.ossreviewtoolkit.model.VcsType
37+
import org.ossreviewtoolkit.model.config.Excludes
38+
import org.ossreviewtoolkit.model.config.PathExclude
39+
import org.ossreviewtoolkit.model.config.PathExcludeReason
3540
import org.ossreviewtoolkit.utils.test.createSpecTempDir
41+
import org.ossreviewtoolkit.utils.test.createTestTempDir
3642

3743
class PackageManagerTest : WordSpec({
3844
val definitionFiles = listOf(
@@ -71,11 +77,7 @@ class PackageManagerTest : WordSpec({
7177
val projectDir = createSpecTempDir()
7278

7379
beforeSpec {
74-
definitionFiles.forEach { file ->
75-
projectDir.resolve(file).also { dir ->
76-
dir.parentFile.mkdirs()
77-
}.writeText("Dummy text to avoid the file to be empty, as empty files are skipped.")
78-
}
80+
definitionFiles.writeFiles(projectDir)
7981
}
8082

8183
"findManagedFiles" should {
@@ -88,11 +90,7 @@ class PackageManagerTest : WordSpec({
8890
it is Unmanaged.Factory
8991
}
9092

91-
// The keys in expected and actual maps of definition files are different instances of package manager
92-
// factories. So to compare values use the package manager types as keys instead.
93-
val managedFilesByName = managedFiles.map { (manager, files) ->
94-
manager.type to files.map { it.relativeTo(projectDir).invariantSeparatorsPath }
95-
}.toMap()
93+
val managedFilesByName = managedFiles.groupByName(projectDir)
9694

9795
assertSoftly {
9896
managedFilesByName["Bower"] should containExactly("bower/bower.json")
@@ -144,11 +142,7 @@ class PackageManagerTest : WordSpec({
144142

145143
managedFiles.size shouldBe 3
146144

147-
// The keys in expected and actual maps of definition files are different instances of package manager
148-
// factories. So to compare values use the package manager types as keys instead.
149-
val managedFilesByName = managedFiles.map { (manager, files) ->
150-
manager.type to files.map { it.relativeTo(projectDir).invariantSeparatorsPath }
151-
}.toMap()
145+
val managedFilesByName = managedFiles.groupByName(projectDir)
152146

153147
managedFilesByName["Gradle"] should containExactlyInAnyOrder(
154148
"gradle-groovy/build.gradle",
@@ -167,6 +161,26 @@ class PackageManagerTest : WordSpec({
167161
managedFiles should beEmpty()
168162
}
169163

164+
"take path excludes into account" {
165+
val tempDir = "test/"
166+
val definitionFilesWithExcludes = definitionFiles +
167+
listOf("pom.xml", "build.gradle", "build.sbt").map { "$tempDir$it" }
168+
val rootDir = createTestTempDir()
169+
definitionFilesWithExcludes.writeFiles(rootDir)
170+
171+
val pathExclude = PathExclude("$tempDir**", PathExcludeReason.TEST_OF)
172+
val excludes = Excludes(paths = listOf(pathExclude))
173+
174+
val managedFilesByName = PackageManager.findManagedFiles(rootDir, excludes = excludes).groupByName(rootDir)
175+
176+
managedFilesByName["Gradle"] should containExactlyInAnyOrder(
177+
"gradle-groovy/build.gradle",
178+
"gradle-kotlin/build.gradle.kts"
179+
)
180+
managedFilesByName["Maven"] should containExactly("maven/pom.xml")
181+
managedFilesByName["SBT"] should containExactly("sbt/build.sbt")
182+
}
183+
170184
"fail if the provided file is not a directory" {
171185
shouldThrow<IllegalArgumentException> {
172186
PackageManager.findManagedFiles(projectDir.resolve("pom.xml"))
@@ -221,3 +235,24 @@ class PackageManagerTest : WordSpec({
221235
}
222236
}
223237
})
238+
239+
/**
240+
* Transform this map with definition files grouped by package manager factories, so that the results of specific
241+
* package managers can be easily accessed. The keys in expected and actual maps of definition files are different
242+
* instances of package manager factories. So to compare values use the package manager types as keys instead.
243+
*/
244+
private fun ManagedProjectFiles.groupByName(projectDir: File) =
245+
map { (manager, files) ->
246+
manager.type to files.map { it.relativeTo(projectDir).invariantSeparatorsPath }
247+
}.toMap()
248+
249+
/**
250+
* Create files with a dummy content in the given [directory] for all the path names in this collection.
251+
*/
252+
private fun Collection<String>.writeFiles(directory: File) {
253+
forEach { file ->
254+
directory.resolve(file).also { dir ->
255+
dir.parentFile.mkdirs()
256+
}.writeText("Dummy text to avoid the file to be empty, as empty files are skipped.")
257+
}
258+
}

0 commit comments

Comments
 (0)