From 1c32cc9a49d8e692949f92a8a517300e498e1a55 Mon Sep 17 00:00:00 2001 From: Dawid Weiss Date: Fri, 4 Nov 2016 16:02:00 +0100 Subject: [PATCH] SOLR-7539: Upgrade the clustering plugin to Carrot2 3.15.0. --- lucene/ivy-versions.properties | 2 +- solr/CHANGES.txt | 4 +- .../clustering/ClusteringComponent.java | 12 ++--- .../carrot2/CarrotClusteringEngine.java | 29 +++++------ .../clustering/carrot2/CarrotParams.java | 10 ++-- ...olrStopwordsCarrot2LexicalDataFactory.java | 49 ++++++++++--------- .../carrot2/CarrotClusteringEngineTest.java | 27 +++++----- .../carrot2/EchoClusteringAlgorithm.java | 5 +- .../carrot2/EchoStemsClusteringAlgorithm.java | 5 +- .../EchoTokensClusteringAlgorithm.java | 5 +- ...icalResourcesCheckClusteringAlgorithm.java | 5 +- .../carrot2/MockClusteringAlgorithm.java | 4 +- solr/licenses/carrot2-mini-3.12.0.jar.sha1 | 1 - solr/licenses/carrot2-mini-3.15.0.jar.sha1 | 1 + 14 files changed, 77 insertions(+), 82 deletions(-) delete mode 100644 solr/licenses/carrot2-mini-3.12.0.jar.sha1 create mode 100644 solr/licenses/carrot2-mini-3.15.0.jar.sha1 diff --git a/lucene/ivy-versions.properties b/lucene/ivy-versions.properties index b92112d8347..c4d1c1163a4 100644 --- a/lucene/ivy-versions.properties +++ b/lucene/ivy-versions.properties @@ -222,7 +222,7 @@ org.bouncycastle.version = 1.45 /org.carrot2.attributes/attributes-binder = 1.3.1 /org.carrot2.shaded/carrot2-guava = 18.0 -/org.carrot2/carrot2-mini = 3.12.0 +/org.carrot2/carrot2-mini = 3.15.0 org.carrot2.morfologik.version = 2.1.1 /org.carrot2/morfologik-fsa = ${org.carrot2.morfologik.version} diff --git a/solr/CHANGES.txt b/solr/CHANGES.txt index fac3759144e..b1786a8b012 100644 --- a/solr/CHANGES.txt +++ b/solr/CHANGES.txt @@ -23,7 +23,7 @@ Consult the LUCENE_CHANGES.txt file for additional, low level, changes in this r Versions of Major Components --------------------- Apache Tika 1.13 -Carrot2 3.12.0 +Carrot2 3.15.0 Velocity 1.7 and Velocity Tools 2.0 Apache UIMA 2.3.1 Apache ZooKeeper 3.4.6 @@ -58,6 +58,8 @@ Bug Fixes Other Changes ---------------------- +* SOLR-7539: Upgrade the clustering plugin to Carrot2 3.15.0. (Dawid Weiss) + * SOLR-9621: Remove several Guava & Apache Commons calls in favor of java 8 alternatives. (Michael Braun via David Smiley) diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/ClusteringComponent.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/ClusteringComponent.java index 42a2de98ae8..6275c906f02 100644 --- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/ClusteringComponent.java +++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/ClusteringComponent.java @@ -19,6 +19,7 @@ package org.apache.solr.handler.clustering; import java.io.IOException; import java.lang.invoke.MethodHandles; import java.util.Collections; +import java.util.HashMap; import java.util.HashSet; import java.util.LinkedHashMap; import java.util.Map; @@ -44,9 +45,6 @@ import org.apache.solr.util.plugin.SolrCoreAware; import org.slf4j.Logger; import org.slf4j.LoggerFactory; -import com.google.common.collect.Maps; - - /** * Provides a plugin for performing cluster analysis. This can either be applied to * search results (e.g., via Carrot2) or for @@ -68,12 +66,12 @@ public class ClusteringComponent extends SearchComponent implements SolrCoreAwar /** * Declaration-order list of search clustering engines. */ - private final LinkedHashMap searchClusteringEngines = Maps.newLinkedHashMap(); - + private final LinkedHashMap searchClusteringEngines = new LinkedHashMap<>(); + /** * Declaration order list of document clustering engines. */ - private final LinkedHashMap documentClusteringEngines = Maps.newLinkedHashMap(); + private final LinkedHashMap documentClusteringEngines = new LinkedHashMap<>(); /** * An unmodifiable view of {@link #searchClusteringEngines}. @@ -173,7 +171,7 @@ public class ClusteringComponent extends SearchComponent implements SolrCoreAwar if (engine != null) { checkAvailable(name, engine); DocListAndSet results = rb.getResults(); - Map docIds = Maps.newHashMapWithExpectedSize(results.docList.size()); + Map docIds = new HashMap<>(results.docList.size()); SolrDocumentList solrDocList = SolrPluginUtils.docListToSolrDocumentList( results.docList, rb.req.getSearcher(), engine.getFieldsToLoad(rb.req), docIds); Object clusters = engine.cluster(rb.getQuery(), solrDocList, docIds, rb.req); diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java index a8548eceb8c..951cce5c4b0 100644 --- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java +++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngine.java @@ -58,6 +58,8 @@ import org.carrot2.core.Document; import org.carrot2.core.IClusteringAlgorithm; import org.carrot2.core.LanguageCode; import org.carrot2.core.attribute.AttributeNames; +import org.carrot2.shaded.guava.common.base.MoreObjects; +import org.carrot2.shaded.guava.common.base.Strings; import org.carrot2.text.linguistic.DefaultLexicalDataFactoryDescriptor; import org.carrot2.text.preprocessing.pipeline.BasicPreprocessingPipelineDescriptor; import org.carrot2.text.preprocessing.pipeline.BasicPreprocessingPipelineDescriptor.AttributeBuilder; @@ -69,12 +71,6 @@ import org.carrot2.util.resource.ResourceLookup; import org.slf4j.Logger; import org.slf4j.LoggerFactory; -import com.google.common.base.Objects; -import com.google.common.base.Strings; -import com.google.common.collect.Lists; -import com.google.common.collect.Maps; -import com.google.common.collect.Sets; - /** * Search results clustering engine based on Carrot2 clustering algorithms. * @@ -155,7 +151,8 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { // Load Carrot2-Workbench exported attribute XMLs based on the 'name' attribute // of this component. This by-name convention lookup is used to simplify configuring algorithms. String componentName = initParams.get(ClusteringEngine.ENGINE_NAME); - log.info("Initializing Clustering Engine '" + Objects.firstNonNull(componentName, "") + "'"); + log.info("Initializing Clustering Engine '" + + MoreObjects.firstNonNull(componentName, "") + "'"); if (!Strings.isNullOrEmpty(componentName)) { IResource[] attributeXmls = resourceLookup.getAll(componentName + "-attributes.xml"); @@ -268,7 +265,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { protected Set getFieldsToLoad(SolrQueryRequest sreq){ SolrParams solrParams = sreq.getParams(); - HashSet fields = Sets.newHashSet(getFieldsForClustering(sreq)); + HashSet fields = new HashSet<>(getFieldsForClustering(sreq)); fields.add(idFieldName); fields.add(solrParams.get(CarrotParams.URL_FIELD_NAME, "url")); fields.addAll(getCustomFieldsMap(solrParams).keySet()); @@ -295,7 +292,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { + " must not be blank."); } - final Set fields = Sets.newHashSet(); + final Set fields = new HashSet<>(); fields.addAll(Arrays.asList(titleFieldSpec.split("[, ]"))); fields.addAll(Arrays.asList(snippetFieldSpec.split("[, ]"))); return fields; @@ -319,7 +316,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { Map customFields = getCustomFieldsMap(solrParams); // Parse language code map string into a map - Map languageCodeMap = Maps.newHashMap(); + Map languageCodeMap = new HashMap<>(); if (StringUtils.isNotBlank(languageField)) { for (String pair : solrParams.get(CarrotParams.LANGUAGE_CODE_MAP, "").split("[, ]")) { final String[] split = pair.split(":"); @@ -340,7 +337,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { if (produceSummary) { highlighter = HighlightComponent.getHighlighter(core); if (highlighter != null){ - Map args = Maps.newHashMap(); + Map args = new HashMap<>(); snippetFieldAry = snippetFieldSpec.split("[, ]"); args.put(HighlightParams.FIELDS, snippetFieldAry); args.put(HighlightParams.HIGHLIGHT, "true"); @@ -466,10 +463,10 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { * custom field names. */ private Map getCustomFieldsMap(SolrParams solrParams) { - Map customFields = Maps.newHashMap(); + Map customFields = new HashMap<>(); String [] customFieldsSpec = solrParams.getParams(CarrotParams.CUSTOM_FIELD_NAME); if (customFieldsSpec != null) { - customFields = Maps.newHashMap(); + customFields = new HashMap<>(); for (String customFieldSpec : customFieldsSpec) { String [] split = customFieldSpec.split(":"); if (split.length == 2 && StringUtils.isNotBlank(split[0]) && StringUtils.isNotBlank(split[1])) { @@ -501,7 +498,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { private List> clustersToNamedList(List carrotClusters, SolrParams solrParams) { - List> result = Lists.newArrayList(); + List> result = new ArrayList<>(); clustersToNamedList(carrotClusters, result, solrParams.getBool( CarrotParams.OUTPUT_SUB_CLUSTERS, true), solrParams.getInt( CarrotParams.NUM_DESCRIPTIONS, Integer.MAX_VALUE)); @@ -534,7 +531,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { // Add documents List docs = outputSubClusters ? outCluster.getDocuments() : outCluster.getAllDocuments(); - List docList = Lists.newArrayList(); + List docList = new ArrayList<>(); cluster.add("docs", docList); for (Document doc : docs) { docList.add(doc.getField(SOLR_DOCUMENT_ID)); @@ -542,7 +539,7 @@ public class CarrotClusteringEngine extends SearchClusteringEngine { // Add subclusters if (outputSubClusters && !outCluster.getSubclusters().isEmpty()) { - List> subclusters = Lists.newArrayList(); + List> subclusters = new ArrayList<>(); cluster.add("clusters", subclusters); clustersToNamedList(outCluster.getSubclusters(), subclusters, outputSubClusters, maxLabels); diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java index 71a22fe9343..d0fb0d5ded7 100644 --- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java +++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/CarrotParams.java @@ -16,10 +16,10 @@ */ package org.apache.solr.handler.clustering.carrot2; +import java.util.Arrays; +import java.util.HashSet; import java.util.Set; -import com.google.common.collect.ImmutableSet; - /** * Carrot2 parameter mapping (recognized and mapped if passed via Solr configuration). * @lucene.experimental @@ -50,7 +50,7 @@ public final class CarrotParams { */ public static String RESOURCES_DIR = CARROT_PREFIX + "resourcesDir"; - static final Set CARROT_PARAM_NAMES = ImmutableSet.of( + static final Set CARROT_PARAM_NAMES = new HashSet<>(Arrays.asList( ALGORITHM, TITLE_FIELD_NAME, @@ -66,8 +66,8 @@ public final class CarrotParams { NUM_DESCRIPTIONS, OUTPUT_SUB_CLUSTERS, RESOURCES_DIR, - LANGUAGE_CODE_MAP); - + LANGUAGE_CODE_MAP)); + /** No instances. */ private CarrotParams() {} } diff --git a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/SolrStopwordsCarrot2LexicalDataFactory.java b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/SolrStopwordsCarrot2LexicalDataFactory.java index 3caaf54f27a..569b1bb2307 100644 --- a/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/SolrStopwordsCarrot2LexicalDataFactory.java +++ b/solr/contrib/clustering/src/java/org/apache/solr/handler/clustering/carrot2/SolrStopwordsCarrot2LexicalDataFactory.java @@ -16,7 +16,9 @@ */ package org.apache.solr.handler.clustering.carrot2; -import java.util.Collection; +import java.util.ArrayList; +import java.util.HashMap; +import java.util.List; import java.util.Set; import org.apache.lucene.analysis.Analyzer; @@ -26,6 +28,7 @@ import org.apache.lucene.analysis.core.StopFilterFactory; import org.apache.lucene.analysis.util.TokenFilterFactory; import org.apache.solr.analysis.TokenizerChain; import org.apache.solr.core.SolrCore; +import org.apache.solr.schema.IndexSchema; import org.carrot2.core.LanguageCode; import org.carrot2.core.attribute.Init; import org.carrot2.core.attribute.Processing; @@ -37,9 +40,6 @@ import org.carrot2.util.attribute.Attribute; import org.carrot2.util.attribute.Bindable; import org.carrot2.util.attribute.Input; -import com.google.common.collect.HashMultimap; -import com.google.common.collect.Multimap; - /** * An implementation of Carrot2's {@link ILexicalDataFactory} that adds stop * words from a field's StopFilter to the default stop words used in Carrot2, @@ -67,7 +67,7 @@ public class SolrStopwordsCarrot2LexicalDataFactory implements ILexicalDataFacto /** * A lazily-built cache of stop words per field. */ - private Multimap solrStopWords = HashMultimap.create(); + private HashMap> solrStopWords = new HashMap<>(); /** * Carrot2's default lexical resources to use in addition to Solr's stop @@ -79,31 +79,34 @@ public class SolrStopwordsCarrot2LexicalDataFactory implements ILexicalDataFacto * Obtains stop words for a field from the associated * {@link StopFilterFactory}, if any. */ - private Collection getSolrStopWordsForField(String fieldName) { + private List getSolrStopWordsForField(String fieldName) { // No need to synchronize here, Carrot2 ensures that instances // of this class are not used by multiple threads at a time. - if (!solrStopWords.containsKey(fieldName)) { - final Analyzer fieldAnalyzer = core.getLatestSchema().getFieldType(fieldName) - .getIndexAnalyzer(); - if (fieldAnalyzer instanceof TokenizerChain) { - final TokenFilterFactory[] filterFactories = ((TokenizerChain) fieldAnalyzer) - .getTokenFilterFactories(); - for (TokenFilterFactory factory : filterFactories) { - if (factory instanceof StopFilterFactory) { - // StopFilterFactory holds the stop words in a CharArraySet - solrStopWords.put(fieldName, - ((StopFilterFactory) factory).getStopWords()); - } + synchronized (solrStopWords) { + if (!solrStopWords.containsKey(fieldName)) { + solrStopWords.put(fieldName, new ArrayList<>()); - if (factory instanceof CommonGramsFilterFactory) { - solrStopWords.put(fieldName, - ((CommonGramsFilterFactory) factory) - .getCommonWords()); + IndexSchema schema = core.getLatestSchema(); + final Analyzer fieldAnalyzer = schema.getFieldType(fieldName).getIndexAnalyzer(); + if (fieldAnalyzer instanceof TokenizerChain) { + final TokenFilterFactory[] filterFactories = + ((TokenizerChain) fieldAnalyzer).getTokenFilterFactories(); + for (TokenFilterFactory factory : filterFactories) { + if (factory instanceof StopFilterFactory) { + // StopFilterFactory holds the stop words in a CharArraySet + CharArraySet stopWords = ((StopFilterFactory) factory).getStopWords(); + solrStopWords.get(fieldName).add(stopWords); + } + + if (factory instanceof CommonGramsFilterFactory) { + CharArraySet commonWords = ((CommonGramsFilterFactory) factory).getCommonWords(); + solrStopWords.get(fieldName).add(commonWords); + } } } } + return solrStopWords.get(fieldName); } - return solrStopWords.get(fieldName); } @Override diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java index 752570de3c1..3d6f3d39e5f 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/CarrotClusteringEngineTest.java @@ -17,6 +17,9 @@ package org.apache.solr.handler.clustering.carrot2; import java.io.IOException; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.Collections; import java.util.HashMap; import java.util.List; import java.util.Map; @@ -45,9 +48,6 @@ import org.carrot2.core.LanguageCode; import org.carrot2.util.attribute.AttributeUtils; import org.junit.Test; -import com.google.common.collect.ImmutableList; -import com.google.common.collect.Lists; - /** * */ @@ -211,7 +211,7 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { // stoplabels.mt, so we're expecting only one cluster with label "online". final List> clusters = checkEngine( getClusteringEngine(engineName), 1, params); - assertEquals(getLabels(clusters.get(0)), ImmutableList.of("online")); + assertEquals(getLabels(clusters.get(0)), Collections.singletonList("online")); } @Test @@ -226,7 +226,7 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { // only one cluster with label "online". final List> clusters = checkEngine( getClusteringEngine("lexical-resource-check"), 1, params); - assertEquals(getLabels(clusters.get(0)), ImmutableList.of("online")); + assertEquals(getLabels(clusters.get(0)), Collections.singletonList("online")); } @Test @@ -243,9 +243,8 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { final List> clusters = checkEngine( getClusteringEngine("lexical-resource-check"), 2, params); - assertEquals(ImmutableList.of("online"), getLabels(clusters.get(0))); - assertEquals(ImmutableList.of("solrownstopword"), - getLabels(clusters.get(1))); + assertEquals(Collections.singletonList("online"), getLabels(clusters.get(0))); + assertEquals(Collections.singletonList("solrownstopword"), getLabels(clusters.get(1))); } @Test @@ -395,8 +394,8 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { ClusteringComponent comp = (ClusteringComponent) h.getCore().getSearchComponent("clustering-name-default"); Map engines = getSearchClusteringEngines(comp); assertEquals( - Lists.newArrayList("stc", "default", "mock"), - Lists.newArrayList(engines.keySet())); + Arrays.asList("stc", "default", "mock"), + new ArrayList<>(engines.keySet())); assertEquals( LingoClusteringAlgorithm.class, ((CarrotClusteringEngine) engines.get(ClusteringEngine.DEFAULT_ENGINE_NAME)).getClusteringAlgorithmClass()); @@ -407,8 +406,8 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { ClusteringComponent comp = (ClusteringComponent) h.getCore().getSearchComponent("clustering-name-decl-order"); Map engines = getSearchClusteringEngines(comp); assertEquals( - Lists.newArrayList("unavailable", "lingo", "stc", "mock", "default"), - Lists.newArrayList(engines.keySet())); + Arrays.asList("unavailable", "lingo", "stc", "mock", "default"), + new ArrayList<>(engines.keySet())); assertEquals( LingoClusteringAlgorithm.class, ((CarrotClusteringEngine) engines.get(ClusteringEngine.DEFAULT_ENGINE_NAME)).getClusteringAlgorithmClass()); @@ -419,8 +418,8 @@ public class CarrotClusteringEngineTest extends AbstractClusteringTestCase { ClusteringComponent comp = (ClusteringComponent) h.getCore().getSearchComponent("clustering-name-dups"); Map engines = getSearchClusteringEngines(comp); assertEquals( - Lists.newArrayList("", "default"), - Lists.newArrayList(engines.keySet())); + Arrays.asList("", "default"), + new ArrayList<>(engines.keySet())); assertEquals( MockClusteringAlgorithm.class, ((CarrotClusteringEngine) engines.get(ClusteringEngine.DEFAULT_ENGINE_NAME)).getClusteringAlgorithmClass()); diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoClusteringAlgorithm.java index 5fb13f88519..2c95da3da9a 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoClusteringAlgorithm.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoClusteringAlgorithm.java @@ -15,6 +15,7 @@ * limitations under the License. */ package org.apache.solr.handler.clustering.carrot2; +import java.util.ArrayList; import java.util.List; import org.carrot2.core.Cluster; @@ -29,8 +30,6 @@ import org.carrot2.util.attribute.Bindable; import org.carrot2.util.attribute.Input; import org.carrot2.util.attribute.Output; -import com.google.common.collect.Lists; - /** * A mock Carrot2 clustering algorithm that outputs input documents as clusters. * Useful only in tests. @@ -56,7 +55,7 @@ public class EchoClusteringAlgorithm extends ProcessingComponentBase implements @Override public void process() throws ProcessingException { - clusters = Lists.newArrayListWithCapacity(documents.size()); + clusters = new ArrayList<>(); for (Document document : documents) { final Cluster cluster = new Cluster(); diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java index dfd762f5211..f39fcd968b8 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoStemsClusteringAlgorithm.java @@ -16,6 +16,7 @@ */ package org.apache.solr.handler.clustering.carrot2; +import java.util.ArrayList; import java.util.List; import org.carrot2.core.Cluster; @@ -36,8 +37,6 @@ import org.carrot2.util.attribute.Bindable; import org.carrot2.util.attribute.Input; import org.carrot2.util.attribute.Output; -import com.google.common.collect.Lists; - /** * A mock Carrot2 clustering algorithm that outputs stem of each token of each * document as a separate cluster. Useful only in tests. @@ -64,7 +63,7 @@ public class EchoStemsClusteringAlgorithm extends ProcessingComponentBase final AllTokens allTokens = preprocessingContext.allTokens; final AllWords allWords = preprocessingContext.allWords; final AllStems allStems = preprocessingContext.allStems; - clusters = Lists.newArrayListWithCapacity(allTokens.image.length); + clusters = new ArrayList<>(); for (int i = 0; i < allTokens.image.length; i++) { if (allTokens.wordIndex[i] >= 0) { clusters.add(new Cluster(new String( diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java index 0346209e82e..32e47d82fa6 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/EchoTokensClusteringAlgorithm.java @@ -16,6 +16,7 @@ */ package org.apache.solr.handler.clustering.carrot2; +import java.util.ArrayList; import java.util.List; import org.carrot2.core.Cluster; @@ -33,7 +34,6 @@ import org.carrot2.util.attribute.Bindable; import org.carrot2.util.attribute.Input; import org.carrot2.util.attribute.Output; -import com.google.common.collect.Lists; /** * A mock Carrot2 clustering algorithm that outputs each token of each document @@ -58,8 +58,7 @@ public class EchoTokensClusteringAlgorithm extends ProcessingComponentBase public void process() throws ProcessingException { final PreprocessingContext preprocessingContext = preprocessing.preprocess( documents, "", LanguageCode.ENGLISH); - clusters = Lists - .newArrayListWithCapacity(preprocessingContext.allTokens.image.length); + clusters = new ArrayList<>(); for (char[] token : preprocessingContext.allTokens.image) { if (token != null) { clusters.add(new Cluster(new String(token))); diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/LexicalResourcesCheckClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/LexicalResourcesCheckClusteringAlgorithm.java index e32f5af857b..9f69040a9ed 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/LexicalResourcesCheckClusteringAlgorithm.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/LexicalResourcesCheckClusteringAlgorithm.java @@ -16,6 +16,7 @@ */ package org.apache.solr.handler.clustering.carrot2; +import java.util.ArrayList; import java.util.List; import org.carrot2.core.Cluster; @@ -33,8 +34,6 @@ import org.carrot2.util.attribute.Bindable; import org.carrot2.util.attribute.Input; import org.carrot2.util.attribute.Output; -import com.google.common.collect.Lists; - /** * A mock implementation of Carrot2 clustering algorithm for testing whether the * customized lexical resource lookup works correctly. This algorithm ignores @@ -60,7 +59,7 @@ public class LexicalResourcesCheckClusteringAlgorithm extends @Override public void process() throws ProcessingException { - clusters = Lists.newArrayList(); + clusters = new ArrayList<>(); if (wordsToCheck == null) { return; } diff --git a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/MockClusteringAlgorithm.java b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/MockClusteringAlgorithm.java index 899bcbc0e9d..ba978a5dace 100644 --- a/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/MockClusteringAlgorithm.java +++ b/solr/contrib/clustering/src/test/org/apache/solr/handler/clustering/carrot2/MockClusteringAlgorithm.java @@ -15,13 +15,13 @@ * limitations under the License. */ package org.apache.solr.handler.clustering.carrot2; -import com.google.common.collect.Lists; import org.carrot2.core.*; import org.carrot2.core.attribute.AttributeNames; import org.carrot2.core.attribute.Processing; import org.carrot2.util.attribute.*; import org.carrot2.util.attribute.constraint.IntRange; +import java.util.ArrayList; import java.util.List; @Bindable(prefix = "MockClusteringAlgorithm") @@ -62,7 +62,7 @@ public class MockClusteringAlgorithm extends ProcessingComponentBase implements @Override public void process() throws ProcessingException { - clusters = Lists.newArrayList(); + clusters = new ArrayList<>(); if (documents == null) { return; } diff --git a/solr/licenses/carrot2-mini-3.12.0.jar.sha1 b/solr/licenses/carrot2-mini-3.12.0.jar.sha1 deleted file mode 100644 index 5a90da6d079..00000000000 --- a/solr/licenses/carrot2-mini-3.12.0.jar.sha1 +++ /dev/null @@ -1 +0,0 @@ -9d8b42afe43ba5c0a0c5d67208d5c919e45c3584 diff --git a/solr/licenses/carrot2-mini-3.15.0.jar.sha1 b/solr/licenses/carrot2-mini-3.15.0.jar.sha1 new file mode 100644 index 00000000000..cd87a99aaa0 --- /dev/null +++ b/solr/licenses/carrot2-mini-3.15.0.jar.sha1 @@ -0,0 +1 @@ +5d76ec388711056bfaaacc354ed04ffa6811c7b7