/* * Licensed to the Apache Software Foundation (ASF) under one or more * contributor license agreements. See the NOTICE file distributed with * this work for additional information regarding copyright ownership. * The ASF licenses this file to You under the Apache License, Version 2.0 * (the "License"); you may not use this file except in compliance with * the License. You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ import org.apache.rat.Defaults import org.apache.rat.document.impl.FileDocument import org.apache.rat.api.MetaData import javax.inject.Inject; import org.gradle.internal.logging.progress.ProgressLoggerFactory import org.gradle.internal.logging.progress.ProgressLogger buildscript { repositories { mavenCentral() } dependencies { classpath "org.apache.rat:apache-rat:${scriptDepVersions['apache-rat']}" } } def extensions = [ 'adoc', 'bat', 'cmd', 'css', 'g4', 'gradle', 'groovy', 'html', 'java', 'jflex', 'jj', 'js', 'json', 'md', 'mdtext', 'pl', 'policy', 'properties', 'py', 'sh', 'template', 'vm', 'xml', 'xsl', ] // Create source validation task local for each project's files. subprojects { task validateSourcePatterns(type: ValidateSourcePatternsTask) { task -> group = 'Verification' description = 'Validate Source Patterns' // This task has no proper outputs. setupDummyOutputs(task) sourceFiles = fileTree(projectDir) { extensions.each{ include "**/*.${it}" } // Don't go into child projects (scanned separately). childProjects.keySet().each{ exclude "${it}/**" } // default excludes. exclude 'build/**' } } // Add source validation to per-project checks as well. check.dependsOn validateSourcePatterns } configure(project(':lucene:benchmark')) { project.tasks.withType(ValidateSourcePatternsTask) { sourceFiles.exclude 'temp/**' sourceFiles.exclude 'work/**' } } configure(project(':solr:core')) { project.tasks.withType(ValidateSourcePatternsTask) { sourceFiles.exclude 'src/**/CheckLoggingConfiguration.java' sourceFiles.exclude 'src/test/org/apache/hadoop/**' } } configure(rootProject) { task validateSourcePatterns(type: ValidateSourcePatternsTask) { task -> group = 'Verification' description = 'Validate Source Patterns' // This task has no proper outputs. setupDummyOutputs(task) sourceFiles = fileTree(projectDir) { extensions.each{ include "**/*.${it}" } // We do not scan for *.txt by default (broken files in subprojects), // but in root we can do this). include '**/*.txt' // Don't go into child projects (scanned separately). childProjects.keySet().each{ exclude "${it}/**" } // default excludes. exclude '**/build/**' exclude 'dev-tools/missing-doclet/src/**/*.java' // <-- TODO: remove once we allow "var" on master // ourselves :-) exclude 'gradle/validation/validate-source-patterns.gradle' } } check.dependsOn validateSourcePatterns } class ValidateSourcePatternsTask extends DefaultTask { private ProgressLoggerFactory progressLoggerFactory @InputFiles FileTree sourceFiles @Inject ValidateSourcePatternsTask(ProgressLoggerFactory progressLoggerFactory) { this.progressLoggerFactory = progressLoggerFactory } @TaskAction public void check() { def invalidPatterns = [ (~$/@author\b/$) : '@author javadoc tag', (~$/(?i)\bno(n|)commit\b/$) : 'nocommit', (~$/\bTOOD:/$) : 'TOOD instead TODO', (~$/\t/$) : 'tabs instead spaces', (~$/\Q/**\E((?:\s)|(?:\*))*\Q{@inheritDoc}\E((?:\s)|(?:\*))*\Q*/\E/$) : '{@inheritDoc} on its own is unnecessary', (~$/\$$(?:LastChanged)?Date\b/$) : 'svn keyword', (~$/\$$(?:(?:LastChanged)?Revision|Rev)\b/$) : 'svn keyword', (~$/\$$(?:LastChangedBy|Author)\b/$) : 'svn keyword', (~$/\$$(?:Head)?URL\b/$) : 'svn keyword', (~$/\$$Id\b/$) : 'svn keyword', (~$/\$$Header\b/$) : 'svn keyword', (~$/\$$Source\b/$) : 'svn keyword', (~$/^\uFEFF/$) : 'UTF-8 byte order mark', (~$/import java\.lang\.\w+;/$) : 'java.lang import is unnecessary' ] // Python and others merrily use var declarations, this is a problem _only_ in Java at least for 8x where we're forbidding var declarations def invalidJavaOnlyPatterns = [ (~$/\n\s*var\s+.*=.*<>.*/$) : 'Diamond operators should not be used with var', (~$/\n\s*var\s+/$) : 'var is not allowed in until we stop development on the 8x code line' ] def found = 0; def violations = new TreeSet(); def reportViolation = { f, name -> logger.error('{}: {}', name, f); violations.add(name); found++; } def javadocsPattern = ~$/(?sm)^\Q/**\E(.*?)\Q*/\E/$; def javaCommentPattern = ~$/(?sm)^\Q/*\E(.*?)\Q*/\E/$; def xmlCommentPattern = ~$/(?sm)\Q\E/$; def lineSplitter = ~$/[\r\n]+/$; def singleLineSplitter = ~$/\r?\n/$; def licenseMatcher = Defaults.createDefaultMatcher(); def validLoggerPattern = ~$/(?s)\b(private\s|static\s|final\s){3}+\s*Logger\s+\p{javaJavaIdentifierStart}+\s+=\s+\QLoggerFactory.getLogger(MethodHandles.lookup().lookupClass());\E/$; def validLoggerNamePattern = ~$/(?s)\b(private\s|static\s|final\s){3}+\s*Logger\s+log+\s+=\s+\QLoggerFactory.getLogger(MethodHandles.lookup().lookupClass());\E/$; def packagePattern = ~$/(?m)^\s*package\s+org\.apache.*;/$; def xmlTagPattern = ~$/(?m)\s*<[a-zA-Z].*/$; def sourceHeaderPattern = ~$/\[source\b.*/$; def blockBoundaryPattern = ~$/----\s*/$; def blockTitlePattern = ~$/\..*/$; def unescapedSymbolPattern = ~$/(?<=[^\\]|^)([-=]>|<[-=])/$; // SOLR-10883 def extendsLuceneTestCasePattern = ~$/public.*?class.*?extends.*?LuceneTestCase[^\n]*?\n/$; def validSPINameJavadocTag = ~$/(?s)\s*\*\s*@lucene\.spi\s+\{@value #NAME\}/$; def isLicense = { matcher, ratDocument -> licenseMatcher.reset(); return lineSplitter.split(matcher.group(1)).any{ licenseMatcher.match(ratDocument, it) }; } def checkLicenseHeaderPrecedes = { f, description, contentPattern, commentPattern, text, ratDocument -> def contentMatcher = contentPattern.matcher(text); if (contentMatcher.find()) { def contentStartPos = contentMatcher.start(); def commentMatcher = commentPattern.matcher(text); while (commentMatcher.find()) { if (isLicense(commentMatcher, ratDocument)) { if (commentMatcher.start() < contentStartPos) { break; // This file is all good, so break loop: license header precedes 'description' definition } else { reportViolation(f, description+' declaration precedes license header'); } } } } } def checkMockitoAssume = { f, text -> if (text.contains("mockito") && !text.contains("assumeWorkingMockito()")) { reportViolation(f, 'File uses Mockito but has no assumeWorkingMockito() call'); } } def checkForUnescapedSymbolSubstitutions = { f, text -> def inCodeBlock = false; def underSourceHeader = false; def lineNumber = 0; singleLineSplitter.split(text).each { ++lineNumber; if (underSourceHeader) { // This line is either a single source line, or the boundary of a code block inCodeBlock = blockBoundaryPattern.matcher(it).matches(); if ( ! blockTitlePattern.matcher(it).matches()) { underSourceHeader = false; } } else { if (inCodeBlock) { inCodeBlock = ! blockBoundaryPattern.matcher(it).matches(); } else { underSourceHeader = sourceHeaderPattern.matcher(it).lookingAt(); if ( ! underSourceHeader) { def unescapedSymbolMatcher = unescapedSymbolPattern.matcher(it); if (unescapedSymbolMatcher.find()) { reportViolation(f, 'Unescaped symbol "' + unescapedSymbolMatcher.group(1) + '" on line #' + lineNumber); } } } } } } ProgressLogger progress = progressLoggerFactory.newOperation(this.class) progress.start(this.name, this.name) sourceFiles.each{ f -> progress.progress("Scanning ${f.name}") logger.debug('Scanning source file: {}', f); def text = f.getText('UTF-8'); invalidPatterns.each{ pattern,name -> if (pattern.matcher(text).find()) { reportViolation(f, name); } } def javadocsMatcher = javadocsPattern.matcher(text); def ratDocument = new FileDocument(f); while (javadocsMatcher.find()) { if (isLicense(javadocsMatcher, ratDocument)) { reportViolation(f, String.format(Locale.ENGLISH, 'javadoc-style license header [%s]', ratDocument.getMetaData().value(MetaData.RAT_URL_LICENSE_FAMILY_NAME))); } } if (f.name.endsWith('.java')) { if (text.contains('org.slf4j.LoggerFactory')) { if (!validLoggerPattern.matcher(text).find()) { reportViolation(f, 'invalid logging pattern [not private static final, uses static class name]'); } if (!validLoggerNamePattern.matcher(text).find()) { reportViolation(f, 'invalid logger name [log, uses static class name, not specialized logger]') } } // make sure that SPI names of all tokenizers/charfilters/tokenfilters are documented if (!f.name.contains("Test") && !f.name.contains("Mock") && !text.contains("abstract class") && !f.name.equals("TokenizerFactory.java") && !f.name.equals("CharFilterFactory.java") && !f.name.equals("TokenFilterFactory.java") && (f.name.contains("TokenizerFactory") && text.contains("extends TokenizerFactory") || f.name.contains("CharFilterFactory") && text.contains("extends CharFilterFactory") || f.name.contains("FilterFactory") && text.contains("extends TokenFilterFactory"))) { if (!validSPINameJavadocTag.matcher(text).find()) { reportViolation(f, 'invalid spi name documentation') } } checkLicenseHeaderPrecedes(f, 'package', packagePattern, javaCommentPattern, text, ratDocument); if (f.name.contains("Test")) { checkMockitoAssume(f, text); } if (project.path.startsWith(':solr:') && f.name.equals("SolrTestCase.java") == false && f.name.equals("TestXmlQParser.java") == false) { if (extendsLuceneTestCasePattern.matcher(text).find()) { reportViolation(f, "Solr test cases should extend SolrTestCase rather than LuceneTestCase"); } } invalidJavaOnlyPatterns.each { pattern,name -> if (pattern.matcher(text).find()) { reportViolation(f, name); } } } if (f.name.endsWith('.xml')) { checkLicenseHeaderPrecedes(f, '', xmlTagPattern, xmlCommentPattern, text, ratDocument); } if (f.name.endsWith('.adoc')) { checkForUnescapedSymbolSubstitutions(f, text); } } progress.completed() if (found) { throw new GradleException(String.format(Locale.ENGLISH, 'Found %d violations in source files (%s).', found, violations.join(', '))); } } }