2020-01-27 12:05:34 -05:00
|
|
|
/*
|
|
|
|
* Licensed to the Apache Software Foundation (ASF) under one or more
|
|
|
|
* contributor license agreements. See the NOTICE file distributed with
|
|
|
|
* this work for additional information regarding copyright ownership.
|
|
|
|
* The ASF licenses this file to You under the Apache License, Version 2.0
|
|
|
|
* (the "License"); you may not use this file except in compliance with
|
|
|
|
* the License. You may obtain a copy of the License at
|
|
|
|
*
|
|
|
|
* http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
*
|
|
|
|
* Unless required by applicable law or agreed to in writing, software
|
|
|
|
* distributed under the License is distributed on an "AS IS" BASIS,
|
|
|
|
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
|
|
* See the License for the specific language governing permissions and
|
|
|
|
* limitations under the License.
|
|
|
|
*/
|
|
|
|
|
2020-01-27 11:29:59 -05:00
|
|
|
// This adds validation of project dependencies:
|
|
|
|
// 1) license file
|
|
|
|
// 2) notice file
|
|
|
|
// 3) checksum validation/ generation.
|
|
|
|
|
|
|
|
import org.apache.commons.codec.digest.DigestUtils
|
|
|
|
|
|
|
|
// This should be false only for debugging.
|
|
|
|
def failOnError = true
|
|
|
|
|
|
|
|
// Configure license checksum folder for top-level projects.
|
|
|
|
// (The file("licenses") inside the configure scope resolves
|
|
|
|
// relative to the current project so they're not the same).
|
2021-03-18 06:04:45 -04:00
|
|
|
configure(project(":lucene")) {
|
|
|
|
ext.licensesDir = file("licenses")
|
2020-01-27 11:29:59 -05:00
|
|
|
}
|
2021-03-08 08:59:08 -05:00
|
|
|
|
2020-01-27 11:29:59 -05:00
|
|
|
// All known license types. If 'noticeOptional' is true then
|
|
|
|
// the notice file must accompany the license.
|
|
|
|
def licenseTypes = [
|
|
|
|
"ASL" : [name: "Apache Software License 2.0"],
|
|
|
|
"BSD" : [name: "Berkeley Software Distribution"],
|
|
|
|
//BSD like just means someone has taken the BSD license and put in their name, copyright, or it's a very similar license.
|
|
|
|
"BSD_LIKE": [name: "BSD like license"],
|
|
|
|
"CDDL" : [name: "Common Development and Distribution License", noticeOptional: true],
|
|
|
|
"CPL" : [name: "Common Public License"],
|
|
|
|
"EPL" : [name: "Eclipse Public License Version 1.0", noticeOptional: true],
|
|
|
|
"MIT" : [name: "Massachusetts Institute of Tech. License", noticeOptional: true],
|
|
|
|
"MPL" : [name: "Mozilla Public License", noticeOptional: true /* NOT SURE on the required notice */],
|
|
|
|
"PD" : [name: "Public Domain", noticeOptional: true],
|
2021-10-30 13:52:57 -04:00
|
|
|
"PDDL" : [name: "Public Domain Dedication and License", noticeOptional: true],
|
2020-01-27 11:29:59 -05:00
|
|
|
"SUN" : [name: "Sun Open Source License", noticeOptional: true],
|
|
|
|
"COMPOUND": [name: "Compound license (details in NOTICE file)."],
|
|
|
|
]
|
|
|
|
|
|
|
|
allprojects {
|
|
|
|
task licenses() {
|
|
|
|
group = 'Dependency validation'
|
|
|
|
description = "Apply all dependency/ license checks."
|
|
|
|
}
|
|
|
|
check.dependsOn(licenses)
|
|
|
|
}
|
|
|
|
|
|
|
|
subprojects {
|
|
|
|
// Configure jarValidation configuration for all projects. Any dependency
|
|
|
|
// declared on this configuration (or any configuration it extends from) will
|
|
|
|
// be verified.
|
|
|
|
configurations {
|
|
|
|
jarValidation
|
|
|
|
}
|
|
|
|
|
|
|
|
// For Java projects, add all dependencies from the following configurations
|
|
|
|
// to jar validation
|
|
|
|
plugins.withType(JavaPlugin) {
|
|
|
|
configurations {
|
|
|
|
jarValidation {
|
|
|
|
extendsFrom runtimeClasspath
|
|
|
|
extendsFrom compileClasspath
|
|
|
|
extendsFrom testRuntimeClasspath
|
|
|
|
extendsFrom testCompileClasspath
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Collects dependency JAR information for a project and saves it in
|
|
|
|
// project.ext.jarInfos. Each dependency has a map of attributes
|
|
|
|
// which make it easier to process it later on (name, hash, origin module,
|
|
|
|
// see the code below for details).
|
|
|
|
task collectJarInfos() {
|
|
|
|
dependsOn configurations.jarValidation
|
|
|
|
|
|
|
|
doFirst {
|
|
|
|
// When gradle resolves a configuration it applies exclude rules from inherited configurations
|
|
|
|
// globally (this seems like a bug to me). So we process each inherited configuration independently
|
|
|
|
// but make sure there are no other dependencies on jarValidation itself.
|
|
|
|
if (!configurations.jarValidation.dependencies.isEmpty()) {
|
|
|
|
throw new GradleException("jarValidation must only inherit from other configurations (can't have its own dependencies).")
|
|
|
|
}
|
|
|
|
|
|
|
|
def excludeRules = configurations.jarValidation.excludeRules
|
|
|
|
|
|
|
|
ArrayDeque<ResolvedDependency> queue = new ArrayDeque<>()
|
|
|
|
configurations.jarValidation.extendsFrom.each { conf ->
|
|
|
|
if (excludeRules) {
|
2020-06-23 16:10:49 -04:00
|
|
|
conf = conf.copyRecursive()
|
|
|
|
conf.canBeResolved = true
|
|
|
|
conf.canBeConsumed = true
|
2020-01-27 11:29:59 -05:00
|
|
|
conf.excludeRules = excludeRules
|
|
|
|
}
|
|
|
|
if (conf.canBeResolved) {
|
|
|
|
queue.addAll(conf.resolvedConfiguration.firstLevelModuleDependencies)
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
def visited = new HashSet<>()
|
2023-10-03 16:44:55 -04:00
|
|
|
def seenDeps = new HashSet<>()
|
2020-01-27 11:29:59 -05:00
|
|
|
def infos = []
|
|
|
|
|
|
|
|
while (!queue.isEmpty()) {
|
|
|
|
def dep = queue.removeFirst()
|
2023-10-03 16:44:55 -04:00
|
|
|
seenDeps.add(dep)
|
2020-01-27 11:29:59 -05:00
|
|
|
|
|
|
|
// Skip any artifacts from Lucene modules.
|
2021-03-18 06:04:45 -04:00
|
|
|
if (!dep.moduleGroup.startsWith("org.apache.lucene")) {
|
2023-10-03 16:44:55 -04:00
|
|
|
// Make sure we don't keep visiting the same children over and over again
|
|
|
|
dep.children.each { child ->
|
|
|
|
if (!seenDeps.contains(child)) {
|
|
|
|
queue.add(child)
|
|
|
|
}
|
|
|
|
}
|
2020-01-27 11:29:59 -05:00
|
|
|
dep.moduleArtifacts.each { resolvedArtifact ->
|
|
|
|
def file = resolvedArtifact.file
|
|
|
|
if (visited.add(file)) {
|
|
|
|
infos.add([
|
|
|
|
name : resolvedArtifact.name,
|
|
|
|
jarName : file.toPath().getFileName().toString(),
|
|
|
|
path : file,
|
|
|
|
module : resolvedArtifact.moduleVersion,
|
2020-10-08 15:25:51 -04:00
|
|
|
checksum : provider { new DigestUtils(DigestUtils.sha1Digest).digestAsHex(file).trim() },
|
2020-01-27 11:29:59 -05:00
|
|
|
// We keep track of the files referenced by this dependency (sha, license, notice, etc.)
|
|
|
|
// so that we can determine unused dangling files later on.
|
|
|
|
referencedFiles: []
|
|
|
|
])
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
project.ext.jarInfos = infos.sort {a, b -> "${a.module}".compareTo("${b.module}")}
|
|
|
|
// jarInfos.each { info -> println "${info.module}" }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Verifies that each JAR has a corresponding checksum and that it matches actual JAR available for this dependency.
|
|
|
|
task validateJarChecksums() {
|
|
|
|
group = 'Dependency validation'
|
|
|
|
description = "Validate checksums of dependencies"
|
|
|
|
dependsOn collectJarInfos
|
|
|
|
|
|
|
|
doLast {
|
|
|
|
def errors = []
|
|
|
|
jarInfos.each { dep ->
|
|
|
|
def expectedChecksumFile = file("${licensesDir}/${dep.jarName}.sha1")
|
|
|
|
if (!expectedChecksumFile.exists()) {
|
|
|
|
errors << "Dependency checksum missing ('${dep.module}'), expected it at: ${expectedChecksumFile}"
|
|
|
|
} else {
|
|
|
|
dep.referencedFiles += expectedChecksumFile
|
|
|
|
def expected = expectedChecksumFile.getText("UTF-8").trim()
|
|
|
|
def actual = dep.checksum.get()
|
|
|
|
if (expected.compareToIgnoreCase(actual) != 0) {
|
|
|
|
errors << "Dependency checksum mismatch ('${dep.module}'), expected it to be: ${expected}, but was: ${actual}"
|
|
|
|
} else {
|
|
|
|
logger.log(LogLevel.INFO, "Dependency checksum OK ('${dep.module}')")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
if (errors) {
|
|
|
|
def msg = "Dependency checksum validation failed:\n - " + errors.join("\n - ")
|
|
|
|
if (failOnError) {
|
|
|
|
throw new GradleException(msg)
|
|
|
|
} else {
|
|
|
|
logger.log(LogLevel.WARN, "WARNING: ${msg}")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Locate the set of license file candidates for this dependency. We
|
|
|
|
// search for [jar-or-prefix]-LICENSE-[type].txt
|
|
|
|
// where 'jar-or-prefix' can be any '-'-delimited prefix of the dependency JAR's name.
|
|
|
|
// So for 'commons-io' it can be 'commons-io-LICENSE-foo.txt' or
|
|
|
|
// 'commons-LICENSE.txt'
|
2023-03-06 13:17:37 -05:00
|
|
|
tasks.register('validateJarLicenses') {
|
2020-01-27 11:29:59 -05:00
|
|
|
group = 'Dependency validation'
|
|
|
|
description = "Validate license and notice files of dependencies"
|
|
|
|
dependsOn collectJarInfos
|
|
|
|
|
2023-03-06 13:17:37 -05:00
|
|
|
def outputFileName = 'validateJarLicenses'
|
|
|
|
inputs.dir(file(project.rootDir.path + '/lucene/licenses'))
|
|
|
|
.withPropertyName('licenses')
|
|
|
|
.withPathSensitivity(PathSensitivity.RELATIVE)
|
|
|
|
outputs.file(layout.buildDirectory.file(outputFileName))
|
|
|
|
.withPropertyName('validateJarLicensesResult')
|
|
|
|
|
2020-01-27 11:29:59 -05:00
|
|
|
doLast {
|
|
|
|
def errors = []
|
|
|
|
jarInfos.each { dep ->
|
|
|
|
def baseName = dep.name
|
|
|
|
def found = []
|
|
|
|
def candidates = []
|
|
|
|
while (true) {
|
|
|
|
candidates += file("${licensesDir}/${baseName}-LICENSE-[type].txt")
|
|
|
|
found += fileTree(dir: licensesDir, include: "${baseName}-LICENSE-*.txt").files
|
|
|
|
def prefix = baseName.replaceAll(/[\-][^-]+$/, "")
|
|
|
|
if (found || prefix == baseName) {
|
|
|
|
break
|
|
|
|
}
|
|
|
|
baseName = prefix
|
|
|
|
}
|
|
|
|
|
|
|
|
if (found.size() == 0) {
|
|
|
|
errors << "License file missing ('${dep.module}'), expected it at: ${candidates.join(" or ")}," +
|
|
|
|
" where [type] can be any of ${licenseTypes.keySet()}."
|
|
|
|
} else if (found.size() > 1) {
|
|
|
|
errors << "Multiple license files matching for ('${dep.module}'): ${found.join(", ")}"
|
|
|
|
} else {
|
|
|
|
def licenseFile = found.get(0)
|
|
|
|
dep.referencedFiles += licenseFile
|
|
|
|
def m = (licenseFile.name =~ /LICENSE-(.+)\.txt$/)
|
|
|
|
if (!m) throw new GradleException("License file name doesn't contain license type?: ${licenseFile.name}")
|
|
|
|
|
|
|
|
def licenseName = m[0][1]
|
|
|
|
def licenseType = licenseTypes[licenseName]
|
|
|
|
if (!licenseType) {
|
|
|
|
errors << "Unknown license type suffix for ('${dep.module}'): ${licenseFile} (must be one of ${licenseTypes.keySet()})"
|
|
|
|
} else {
|
|
|
|
logger.log(LogLevel.INFO, "Dependency license file OK ('${dep.module}'): " + licenseName)
|
|
|
|
|
|
|
|
// Look for sibling NOTICE file.
|
|
|
|
def noticeFile = file(licenseFile.path.replaceAll(/\-LICENSE-.+/, "-NOTICE.txt"))
|
|
|
|
if (noticeFile.exists()) {
|
|
|
|
dep.referencedFiles += noticeFile
|
|
|
|
logger.log(LogLevel.INFO, "Dependency notice file OK ('${dep.module}'): " + noticeFile)
|
|
|
|
} else if (!licenseType.noticeOptional) {
|
|
|
|
errors << "Notice file missing for ('${dep.module}'), expected it at: ${noticeFile}"
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
2023-03-06 13:17:37 -05:00
|
|
|
// Required to take advantage of incremental building and the build cache
|
|
|
|
def f = new File(project.buildDir.path + "/" + outputFileName)
|
|
|
|
f.write(errors.toString(), "UTF-8")
|
2020-01-27 11:29:59 -05:00
|
|
|
if (errors) {
|
|
|
|
def msg = "Certain license/ notice files are missing:\n - " + errors.join("\n - ")
|
|
|
|
if (failOnError) {
|
|
|
|
throw new GradleException(msg)
|
|
|
|
} else {
|
|
|
|
logger.log(LogLevel.WARN, "WARNING: ${msg}")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
licenses.dependsOn validateJarChecksums, validateJarLicenses
|
|
|
|
}
|
|
|
|
|
|
|
|
// Add top-project level tasks validating dangling files
|
|
|
|
// and regenerating dependency checksums.
|
2021-03-08 08:59:08 -05:00
|
|
|
|
2021-03-18 06:04:45 -04:00
|
|
|
configure(project(":lucene")) {
|
2020-01-27 11:29:59 -05:00
|
|
|
def validationTasks = subprojects.collectMany { it.tasks.matching { it.name == "licenses" } }
|
|
|
|
def jarInfoTasks = subprojects.collectMany { it.tasks.matching { it.name == "collectJarInfos" } }
|
|
|
|
|
|
|
|
// Update dependency checksums.
|
|
|
|
task updateLicenses() {
|
|
|
|
group = 'Dependency validation'
|
2020-04-04 16:14:57 -04:00
|
|
|
description = "Write or update checksums of dependencies. May need to run gradlew --write-locks first if changing dependency versions"
|
2020-01-27 11:29:59 -05:00
|
|
|
dependsOn jarInfoTasks
|
|
|
|
|
|
|
|
doLast {
|
|
|
|
licensesDir.mkdirs()
|
|
|
|
|
|
|
|
// Clean any previous checksums. In theory we wouldn't have to do it --
|
|
|
|
// dangling files from any previous JARs would be reported;
|
|
|
|
// it automates the process of updating versions and makes it easier though so
|
|
|
|
// why not.
|
|
|
|
project.delete fileTree(licensesDir, {
|
|
|
|
include "*.sha1"
|
|
|
|
exclude checkDanglingLicenseFiles.ext.exclude
|
|
|
|
})
|
|
|
|
|
|
|
|
def updated = []
|
|
|
|
jarInfoTasks.collectMany { task -> task.project.jarInfos }.each { dep ->
|
|
|
|
def expectedChecksumFile = file("${licensesDir}/${dep.jarName}.sha1")
|
|
|
|
def actual = dep.checksum.get()
|
|
|
|
if (expectedChecksumFile.exists()) {
|
|
|
|
def expected = expectedChecksumFile.getText("UTF-8").trim()
|
|
|
|
if (expected.compareToIgnoreCase(actual) == 0) {
|
|
|
|
return;
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
updated += "Updated checksum ('${dep.module}'): ${expectedChecksumFile}"
|
|
|
|
expectedChecksumFile.write(actual + "\n", "UTF-8")
|
|
|
|
}
|
|
|
|
|
|
|
|
updated.sort().each { line -> logger.log(LogLevel.LIFECYCLE, line) }
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
// Any validation task must run after all updates have been applied.
|
|
|
|
// We add an ordering constraint that any validation task (or its dependency subgraph)
|
|
|
|
// must run after updateLicenses
|
|
|
|
validationTasks
|
|
|
|
.collectMany { task -> [task, task.dependsOn]}
|
|
|
|
.flatten()
|
|
|
|
.each { task ->
|
|
|
|
task.mustRunAfter updateLicenses
|
|
|
|
}
|
|
|
|
|
|
|
|
// Check for dangling files in the licenses folder.
|
|
|
|
task checkDanglingLicenseFiles() {
|
|
|
|
dependsOn validationTasks
|
|
|
|
|
|
|
|
ext {
|
2021-10-27 14:40:29 -04:00
|
|
|
// Exclude files that are not a result of direct dependencies but have to be there.
|
|
|
|
// It would be probably better to move non-dependency licenses into the actual project
|
|
|
|
// where they're used and only assemble them for the distribution package.
|
|
|
|
exclude = [
|
|
|
|
// Used by Luke.
|
|
|
|
"elegant-icon-font-*",
|
|
|
|
// glove knn dictionary.
|
2021-10-30 13:52:57 -04:00
|
|
|
"glove-LICENSE-PDDL.txt",
|
2021-10-27 14:40:29 -04:00
|
|
|
]
|
2020-01-27 11:29:59 -05:00
|
|
|
}
|
|
|
|
|
|
|
|
doFirst {
|
2021-02-17 18:12:27 -05:00
|
|
|
def allReferenced = validationTasks
|
|
|
|
// Only collect for enabled tasks: https://issues.apache.org/jira/browse/LUCENE-9780
|
|
|
|
.findAll { it.enabled }
|
|
|
|
.collectMany { task ->
|
|
|
|
task.project.jarInfos.collectMany { it.referencedFiles }
|
|
|
|
}
|
|
|
|
.collect { it.toString() }
|
2020-01-27 11:29:59 -05:00
|
|
|
|
|
|
|
def patterns = ext.exclude
|
|
|
|
def allExisting = fileTree(licensesDir, {
|
|
|
|
exclude patterns
|
|
|
|
}).files.collect { it.toString() }
|
|
|
|
|
|
|
|
def dangling = (allExisting - allReferenced).sort()
|
|
|
|
|
|
|
|
if (dangling) {
|
|
|
|
gradle.buildFinished {
|
|
|
|
logger.warn("WARNING: there were unreferenced files under license folder:\n - ${dangling.join("\n - ")}")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
licenses.dependsOn checkDanglingLicenseFiles
|
|
|
|
}
|