SOLR-2129: Provide a Solr module for dynamic metadata extraction/indexing with Apache UIMA

git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/trunk@1062604 13f79535-47bb-0310-9956-ffa450edef68
2011-01-24 01:58:00 +00:00 · 2011-01-24 01:58:00 +00:00 · 6c05d94c93
parent 68dc071064
commit 6c05d94c93
43 changed files with 4751 additions and 1 deletions
--- a/dev-tools/eclipse/dot.classpath
+++ b/dev-tools/eclipse/dot.classpath
@ -73,6 +73,10 @@
 	<classpathentry kind="src" path="solr/contrib/extraction/src/main/java"/>
 	<classpathentry kind="src" path="solr/contrib/extraction/src/test/java"/>
 	<classpathentry kind="src" path="solr/contrib/extraction/src/test/resources"/>
 	<classpathentry kind="src" path="solr/contrib/uima/src/main/java"/>
 	<classpathentry kind="src" path="solr/contrib/uima/src/main/resources"/>
 	<classpathentry kind="src" path="solr/contrib/uima/src/test/java"/>
 	<classpathentry kind="src" path="solr/contrib/uima/src/test/resources"/>
 	<classpathentry kind="lib" path="lucene/lib/ant-1.7.1.jar"/>
 	<classpathentry kind="lib" path="lucene/lib/ant-junit-1.7.1.jar"/>
 	<classpathentry kind="lib" path="lucene/lib/junit-4.7.jar"/>
@ -151,6 +155,12 @@
 	<classpathentry kind="lib" path="solr/contrib/extraction/lib/tika-core-0.8.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/extraction/lib/tika-parsers-0.8.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/extraction/lib/xmlbeans-2.3.0.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/uima/lib/commons-digester-2.0.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/uima/lib/uima-an-alchemy.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/uima/lib/uima-an-calais.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/uima/lib/uima-an-tagger.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/uima/lib/uima-an-wst.jar"/>
 	<classpathentry kind="lib" path="solr/contrib/uima/lib/uima-core.jar"/>
 	<classpathentry kind="con" path="org.eclipse.jdt.launching.JRE_CONTAINER"/>
 	<classpathentry kind="output" path="bin"/>
 </classpath>
--- a/solr/CHANGES.txt
+++ b/solr/CHANGES.txt
@ -411,6 +411,9 @@ New Features
 * SOLR-2188: Added "maxTokenLength" argument to the factories for ClassicTokenizer,
  StandardTokenizer, and UAX29URLEmailTokenizer. (Steven Rowe)
 * SOLR-2129: Added a Solr module for dynamic metadata extraction/indexing with Apache UIMA.
  See contrib/uima/README.txt for more information.  (Tommaso Teofili via rmuir)
 Optimizations
 ----------------------
--- a/solr/build.xml
+++ b/solr/build.xml
@ -218,6 +218,7 @@
          <packageset dir="contrib/dataimporthandler/src/main/java" />
          <packageset dir="contrib/clustering/src/main/java" />
          <packageset dir="contrib/extraction/src/main/java" />
          <packageset dir="contrib/uima/src/main/java" />
          <packageset dir="contrib/analysis-extras/src/java" />
          <group title="Core" packages="org.apache.*" />
          <group title="Common" packages="org.apache.solr.common.*" />
@ -225,6 +226,7 @@
          <group title="contrib: DataImportHandler" packages="org.apache.solr.handler.dataimport*" />
          <group title="contrib: Clustering" packages="org.apache.solr.handler.clustering*" />
          <group title="contrib: Solr Cell" packages="org.apache.solr.handler.extraction*" />
          <group title="contrib: Solr UIMA" packages="org.apache.solr.uima*" />
        </sources>
      </invoke-javadoc>
    </sequential>
@ -514,6 +516,7 @@
      <fileset dir="contrib/dataimporthandler/src/main/java" />
      <fileset dir="contrib/clustering/src/main/java" />
      <fileset dir="contrib/extraction/src/main/java" />
      <fileset dir="contrib/uima/src/main/java" />
      <fileset dir="contrib/analysis-extras/src/java" />
    </clover-setup>
  </target>
@ -617,6 +620,10 @@
              basedir="contrib/clustering/src" />
    <solr-jar destfile="${dist}/apache-solr-analysis-extras-src-${version}.jar"
              basedir="contrib/analysis-extras/src" />
    <solr-jar destfile="${dist}/apache-solr-uima-src-${version}.jar"
              basedir="contrib/uima/src/main/java" >
       <fileset dir="contrib/uima/src/main/resources" />
    </solr-jar>
  </target>
  <target name="dist-javadoc" description="Creates the Solr javadoc distribution files"
@ -635,6 +642,8 @@
              basedir="${build.javadoc}/contrib-solr-cell" />
    <solr-jar destfile="${dist}/apache-solr-analysis-extras-docs-${version}.jar"
              basedir="${build.javadoc}/contrib-solr-analysis-extras" />
    <solr-jar destfile="${dist}/apache-solr-uima-docs-${version}.jar"
              basedir="${build.javadoc}/contrib-solr-uima" />
  </target>
  <!-- Creates the solr jar. -->
@ -731,7 +740,7 @@
      <tarfileset dir="."
        prefix="${fullnamever}"
        includes="LICENSE.txt NOTICE.txt *.txt *.xml lucene-libs/** lib/** src/** example/** client/** contrib/"
-        excludes="lib/README.committers.txt **/data/ **/logs/* **/classes/ **/*.sh **/bin/ src/scripts/ src/site/build/ **/target/ client/ruby/flare/ client/python contrib/**/build/ **/*.iml **/*.ipr **/*.iws contrib/clustering/example/lib/** contrib/clustering/lib/downloads/** contrib/analysis-extras/lib/**" />
+        excludes="lib/README.committers.txt **/data/ **/logs/* **/classes/ **/*.sh **/bin/ src/scripts/ src/site/build/ **/target/ client/ruby/flare/ client/python contrib/**/build/ **/*.iml **/*.ipr **/*.iws contrib/clustering/example/lib/** contrib/clustering/lib/downloads/** contrib/analysis-extras/lib/** contrib/uima/lib/**" />
      <tarfileset dir="."
        prefix="${fullnamever}"
        includes="src/test-files/solr/lib/classes/empty-file-main-lib.txt" />
@ -903,6 +912,14 @@
        </artifact-attachments>
      </m2-deploy>
      <m2-deploy pom.xml="contrib/extraction/solr-uima-pom.xml.template"
                 jar.file="${dist}/apache-solr-uima-${version}.jar">
        <artifact-attachments>
          <attach file="${dist}/apache-solr-uima-src-${version}.jar" classifier="sources"/>
          <attach file="${dist}/apache-solr-uima-docs-${version}.jar" classifier="javadoc"/>
        </artifact-attachments>
      </m2-deploy>
      <m2-deploy pom.xml="src/pom.xml"
                 jar.file="${dist}/apache-solr-core-${version}.jar">
        <artifact-attachments>
@ -952,6 +969,8 @@
      <fileset dir="contrib/extraction/src/test/java"/>
      <fileset dir="contrib/analysis-extras/src/test"/>
      <fileset dir="contrib/analysis-extras/src/test"/>
      <fileset dir="contrib/uima/src/main/java"/>
      <fileset dir="contrib/uima/src/test/java"/>
    </rat:report>
  </target>
--- a/solr/contrib/uima/CHANGES.txt
+++ b/solr/contrib/uima/CHANGES.txt
@ -0,0 +1,17 @@
 Apache Solr UIMA Metadata Extraction Library
                            Release Notes
 This file describes changes to the Solr UIMA (contrib/uima) module. See SOLR-2129 for details.
 Introduction
 ------------
 This module is intended to be used while indexing documents.
 Its purpose is to provide additional on the fly automatically generated fields to the Solr index.
 Such fields could be language, concepts, keywords, sentences, named entities, etc.
 UIMA Dependency
 ---------------
 uima-core, OpenCalaisAnnotator, WhitespaceTokenizer, HMMTagger, AlchemyAPIAnnotator
 Current Version:  2.3.1-SNAPSHOT rev. 999276
 $Id$
--- a/solr/contrib/uima/README.txt
+++ b/solr/contrib/uima/README.txt
@ -0,0 +1,60 @@
 Getting Started
 ---------------
 To start using Solr UIMA Metadata Extraction Library you should go through the following configuration steps:
 1. copy generated solr-uima jar and its libs (under contrib/uima/lib) inside a Solr libraries directory.
 2. modify your schema.xml adding the fields you want to be hold metadata specifying proper values for type, indexed, stored and multiValued options:
 3. for example you could specify the following
  <field name="language" type="string" indexed="true" stored="true" required="false"/>
  <field name="concept" type="string" indexed="true" stored="true" multiValued="true" required="false"/>
  <field name="sentence" type="text" indexed="true" stored="true" multiValued="true" required="false" />
 4. modify your solrconfig.xml adding the following snippet:
  <uimaConfig>
    <runtimeParameters>
      <keyword_apikey>VALID_ALCHEMYAPI_KEY</keyword_apikey>
      <concept_apikey>VALID_ALCHEMYAPI_KEY</concept_apikey>
      <lang_apikey>VALID_ALCHEMYAPI_KEY</lang_apikey>
      <cat_apikey>VALID_ALCHEMYAPI_KEY</cat_apikey>
      <entities_apikey>VALID_ALCHEMYAPI_KEY</entities_apikey>
      <oc_licenseID>VALID_OPENCALAIS_KEY</oc_licenseID>
    </runtimeParameters>
    <analysisEngine>/org/apache/uima/desc/OverridingParamsExtServicesAE.xml</analysisEngine>
    <analyzeFields merge="false">text</analyzeFields>
    <fieldMapping>
      <type name="org.apache.uima.alchemy.ts.concept.ConceptFS">
       <map feature="text" field="concept"/>
      </type>
      <type name="org.apache.uima.alchemy.ts.language.LanguageFS">
       <map feature="language" field="language"/>
      </type>
      <type name="org.apache.uima.SentenceAnnotation">
        <map feature="coveredText" field="sentence"/>
      </type>
    </fieldMapping>
  </uimaConfig>
 5. the analysisEngine tag must contain an AE descriptor inside the specified path in the classpath
 6. the analyzeFields tag must contain the input fields that need to be analyzed by UIMA,
   if merge=true then their content will be merged and analyzed only once
 7. field mapping describes which features of which types should go in a field
 8. define in your solrconfig.xml an UpdateRequestProcessorChain as following:
  <updateRequestProcessorChain name="uima">
    <processor class="org.apache.solr.uima.processor.UIMAProcessorFactory"/>
    <processor class="solr.LogUpdateProcessorFactory" />
    <processor class="solr.RunUpdateProcessorFactory" />
  </updateRequestProcessorChain>
 9. in your solrconfig.xml replace the existing default (<requestHandler name="/update"...)  or create a new UpdateRequestHandler with the following:
  <requestHandler name="/update" class="solr.XmlUpdateRequestHandler">
    <lst name="defaults">
      <str name="update.processor">uima</str>
    </lst>
  </requestHandler>
 Once you're done with the configuration you can index documents which will be automatically enriched with the specified fields
--- a/solr/contrib/uima/build.xml
+++ b/solr/contrib/uima/build.xml
@ -0,0 +1,189 @@
 <?xml version="1.0"?>
 <!--
    Licensed to the Apache Software Foundation (ASF) under one or more
    contributor license agreements.  See the NOTICE file distributed with
    this work for additional information regarding copyright ownership.
    The ASF licenses this file to You under the Apache License, Version 2.0
    the "License"); you may not use this file except in compliance with
    the License.  You may obtain a copy of the License at
        http://www.apache.org/licenses/LICENSE-2.0
    Unless required by applicable law or agreed to in writing, software
    distributed under the License is distributed on an "AS IS" BASIS,
    WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
    See the License for the specific language governing permissions and
    limitations under the License.
 -->
 <project name="solr-uima" default="build">
  <property name="solr-path" value="../.." />
  <import file="../../common-build.xml"/>
  <description>
    Solr Integration with UIMA for extracting metadata from arbitrary (text) fields and enrich document with features extracted from UIMA types (language, sentences, concepts, named entities, etc.)
  </description>
  <path id="common.classpath">
    <pathelement location="${solr-path}/build/solr" />
    <pathelement location="${solr-path}/build/solrj" />
    <fileset dir="lib" includes="*.jar"/>
    <fileset dir="${solr-path}/lib" includes="*.jar"/>
    <path refid="lucene.classpath"/>
    <pathelement location="${basedir}/src/main/resources" />    
  </path>
  <path id="test.classpath">
    <path refid="common.classpath" />
    <pathelement path="${dest}/classes" />
    <pathelement path="${dest}/test-classes" />
    <pathelement location="${solr-path}/build/tests"/> <!-- include solr test code -->
    <pathelement location="${solr-path}/../lucene/build/classes/test" />  <!-- include some lucene test code -->
    <pathelement path="${java.class.path}"/>
  </path>
  <target name="clean">
    <delete failonerror="false" dir="${dest}"/>
  </target>
  <target name="init">
    <mkdir dir="${dest}/classes"/>
    <mkdir dir="${build.javadoc}" />
    <subant target="compileTests">
      <fileset dir="${solr-path}" includes="build.xml"/>
    </subant>
    <subant target="make-manifest">
      <fileset dir="${solr-path}" includes="build.xml"/>
    </subant>
  </target>
  <target name="compile" depends="init">
    <solr-javac destdir="${dest}/classes"
    classpathref="common.classpath">
      <src path="src/main/java" />
    </solr-javac>
  </target>
  <target name="build" depends="compile">
    <solr-jar destfile="${dest}/${fullnamever}.jar" basedir="${dest}/classes"
              manifest="../../${dest}/META-INF/MANIFEST.MF">
      <fileset dir="src/main/resources" />
    </solr-jar>
  </target>
  <target name="compileTests" depends="compile">
  	<solr-javac destdir="${dest}/test-classes"
  	                classpathref="test.classpath">
  	  <src path="src/test/java" />
  	</solr-javac>
        <copy todir="${dest}/test-classes">
          <fileset dir="src/test/resources" excludes="**/*.java"/>
        </copy>
  </target>
  <property name="tempDir" value="${junit.output.dir}/temp" />
  <target name="test" depends="compileTests">
  	<mkdir dir="${junit.output.dir}"/>
    <!-- <mkdir dir="@{tempDir}/@{pattern}"/> 
       This is very loud and obnoxious. abuse touch instead for a "quiet" mkdir
    -->
  	<touch file="${tempDir}/quiet.ant" verbose="false" mkdirs="true"/>
    <condition property="runall">
      <not>
        <or>
          <isset property="testcase"/>
          <isset property="testpackage"/>
          <isset property="testpackageroot"/>
        </or>
      </not>
    </condition>    
  	<junit printsummary="no"
           haltonfailure="no"
           maxmemory="512M"
           errorProperty="tests.failed"
           failureProperty="tests.failed"
           dir="${tempDir}"
           tempdir="${tempDir}"
           forkmode="perBatch"
           >
      <sysproperty key="java.util.logging.config.file" value="${common-solr.dir}/testlogging.properties"/>
      <sysproperty key="tests.luceneMatchVersion" value="${tests.luceneMatchVersion}"/>
      <sysproperty key="tests.codec" value="${tests.codec}"/>
      <sysproperty key="tests.locale" value="${tests.locale}"/>
      <sysproperty key="tests.timezone" value="${tests.timezone}"/>
      <sysproperty key="tests.multiplier" value="${tests.multiplier}"/>
      <sysproperty key="tests.iter" value="${tests.iter}"/>
      <sysproperty key="tests.seed" value="${tests.seed}"/>
      <sysproperty key="jetty.insecurerandom" value="1"/>
      <sysproperty key="tempDir" file="${tempDir}"/>
      <sysproperty key="testmethod" value="${testmethod}"/>
      <jvmarg line="${args}"/>
      <formatter classname="${junit.details.formatter}" usefile="false" if="junit.details"/>
      <classpath refid="test.classpath"/>
      <assertions>
        <enable package="org.apache.lucene"/>
        <enable package="org.apache.solr"/>
      </assertions>
      <formatter type="${junit.formatter}"/>
      <batchtest fork="yes" todir="${junit.output.dir}" if="runall">
        <fileset dir="src/test/java" includes="${junit.includes}"/>
      </batchtest>
      <batchtest fork="yes" todir="${junit.output.dir}" if="testcase">
        <fileset dir="src/test/java" includes="**/${testcase}.java"/>
      </batchtest>
      <batchtest fork="yes" todir="${junit.output.dir}" if="testpackage">
        <fileset dir="src/test/java" includes="**/${testpackage}/**/Test*.java,**/${testpackage}/**/*Test.java"/>
      </batchtest>
      <batchtest fork="yes" todir="${junit.output.dir}" if="testpackageroot">
        <fileset dir="src/test/java" includes="**/${testpackageroot}/Test*.java,**/${testpackageroot}/*Test.java"/>
      </batchtest>
    </junit>
    <fail if="tests.failed">Tests failed!</fail>
  </target>
  <target name="test-reports"
          description="Generates HTML test reports.">
    <mkdir dir="${junit.reports}"/>
    <junitreport todir="${junit.output.dir}">
      <fileset dir="${junit.output.dir}">
        <include name="TEST-*.xml"/>
      </fileset>
      <report format="frames" todir="${junit.reports}"/>
    </junitreport>
  </target>
  <target name="dist" depends="build">
    <copy file="build/${fullnamever}.jar" todir="${solr-path}/dist"/>
  </target>
  <target name="example" depends="build">
    <!-- :NOOP: this use to copy libs but now we can refer to them by path -->
  </target>
  <target name="javadoc">
   	<sequential>
      <mkdir dir="${build.javadoc}/contrib-${name}"/>
      <path id="javadoc.classpath">
        <path refid="common.classpath"/>
      </path>
      <invoke-javadoc
        destdir="${build.javadoc}/contrib-${name}"
      	title="${Name} ${version} contrib-${fullnamever} API">
        <sources>
          <packageset dir="src/main/java"/>
        </sources>
      </invoke-javadoc>
    </sequential>
  </target>
 </project>
--- a/solr/contrib/uima/lib/commons-digester-2.0.jar
+++ b/solr/contrib/uima/lib/commons-digester-2.0.jar
@ -0,0 +1,2 @@
 AnyObjectId[9c8bd13a2002a9ff5b35b873b9f111d5281ad201] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/lib/commons-lang-2.4.jar
+++ b/solr/contrib/uima/lib/commons-lang-2.4.jar
@ -0,0 +1,2 @@
 AnyObjectId[532939ecab6b77ccb77af3635c55ff9752b70ab7] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/lib/uima-an-alchemy.jar
+++ b/solr/contrib/uima/lib/uima-an-alchemy.jar
@ -0,0 +1,2 @@
 AnyObjectId[33165678da937e03cb069449b40f1cf690beda0a] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/lib/uima-an-calais.jar
+++ b/solr/contrib/uima/lib/uima-an-calais.jar
@ -0,0 +1,2 @@
 AnyObjectId[5dfc32bce5e444a9bb3387d664485f7bfdc438ad] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/lib/uima-an-tagger.jar
+++ b/solr/contrib/uima/lib/uima-an-tagger.jar
@ -0,0 +1,2 @@
 AnyObjectId[bf90c19d2c1f77e300b94363385841ec1225b4b9] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/lib/uima-an-wst.jar
+++ b/solr/contrib/uima/lib/uima-an-wst.jar
@ -0,0 +1,2 @@
 AnyObjectId[9518da64cdf5d378273ab40a06823a7768f18ece] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/lib/uima-core.jar
+++ b/solr/contrib/uima/lib/uima-core.jar
@ -0,0 +1,2 @@
 AnyObjectId[72991424bdfe4776f66feab7ff4e8564f12d2659] was removed in git history.
 Apache SVN contains full history.
--- a/solr/contrib/uima/solr-uima-pom.xml.template
+++ b/solr/contrib/uima/solr-uima-pom.xml.template
@ -0,0 +1,115 @@
 <project xmlns="http://maven.apache.org/POM/4.0.0" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
  xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/maven-v4_0_0.xsd">
  <!--
    Licensed to the Apache Software Foundation (ASF) under one
    or more contributor license agreements.  See the NOTICE file
    distributed with this work for additional information
    regarding copyright ownership.  The ASF licenses this file
    to you under the Apache License, Version 2.0 (the
    "License"); you may not use this file except in compliance
    with the License.  You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0
    Unless required by applicable law or agreed to in writing,
    software distributed under the License is distributed on an
    "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
    KIND, either express or implied.  See the License for the
    specific language governing permissions and limitations
    under the License.
  -->
  <modelVersion>4.0.0</modelVersion>
  <groupId>org.apache.solr</groupId>
  <artifactId>solr-uima</artifactId>
  <version>0.0.2-SNAPSHOT</version>
  <name>Solr - UIMA integration</name>
  <properties>
    <uimaVersion>2.3.1-SNAPSHOT</uimaVersion>
  </properties>
  <dependencies>
    <dependency>
      <groupId>org.apache.solr</groupId>
      <artifactId>solr-core</artifactId>
      <version>1.4.1</version>
    </dependency>
    <dependency>
      <groupId>org.apache.uima</groupId>
      <artifactId>uimaj-core</artifactId>
      <version>${uimaVersion}</version>
    </dependency>
    <dependency>
      <groupId>org.apache.uima</groupId>
      <artifactId>alchemy-annotator</artifactId>
      <version>${uimaVersion}</version>
    </dependency>
    <dependency>
      <groupId>org.apache.uima</groupId>
      <artifactId>OpenCalaisAnnotator</artifactId>
      <version>${uimaVersion}</version>
    </dependency>
    <dependency>
      <groupId>junit</groupId>
      <artifactId>junit</artifactId>
      <version>4.7</version>
      <type>jar</type>
      <scope>test</scope>
    </dependency>
    <dependency>
      <groupId>org.slf4j</groupId>
      <artifactId>slf4j-simple</artifactId>
      <version>1.5.5</version>
    </dependency>
    <dependency>
      <groupId>org.apache.uima</groupId>
      <artifactId>WhitespaceTokenizer</artifactId>
      <version>${uimaVersion}</version>
    </dependency>
    <dependency>
      <groupId>org.apache.uima</groupId>
      <artifactId>Tagger</artifactId>
      <version>${uimaVersion}</version>
    </dependency>
  </dependencies>
  <build>
    <pluginManagement>
      <plugins>
        <plugin>
          <groupId>com.googlecode.maven-gcu-plugin</groupId>
          <artifactId>maven-gcu-plugin</artifactId>
          <version>1.0</version>
        </plugin>
      </plugins>
    </pluginManagement>
    <plugins>
      <plugin>
        <groupId>org.apache.maven.plugins</groupId>
        <artifactId>maven-compiler-plugin</artifactId>
        <version>2.3.1</version>
        <configuration>
          <source>1.5</source>
          <target>1.5</target>
        </configuration>
      </plugin>
      <plugin>
        <groupId>com.googlecode.maven-gcu-plugin</groupId>
        <artifactId>maven-gcu-plugin</artifactId>
        <version>1.0</version>
        <configuration>
          <serverId>googlecode</serverId>
          <failsOnError>true</failsOnError>
          <projectName>${project.artifactId}</projectName>
          <uploads>
            <upload>
              <file>${project.build.directory}/${project.artifactId}-${project.version}.${project.packaging}</file>
              <summary>${project.name} sources bundle ${project.version}</summary>
              <labels>
                <label>Featured</label>
                <label>Type-Archive</label>
              </labels>
            </upload>
          </uploads>
        </configuration>
      </plugin>
    </plugins>
  </build>
 </project>
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/SolrUIMAConfiguration.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/SolrUIMAConfiguration.java
@ -0,0 +1,69 @@
 package org.apache.solr.uima.processor;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.util.Map;
 /**
 * Configuration holding all the configurable parameters for calling UIMA inside Solr
 * 
 * @version $Id$
 */
 public class SolrUIMAConfiguration {
  private String[] fieldsToAnalyze;
  private boolean fieldsMerging;
  private Map<String, Map<String, String>> typesFeaturesFieldsMapping;
  private String aePath;
  private Map<String, String> runtimeParameters;
  public SolrUIMAConfiguration(String aePath, String[] fieldsToAnalyze, boolean fieldsMerging,
          Map<String, Map<String, String>> typesFeaturesFieldsMapping,
          Map<String, String> runtimeParameters) {
    this.aePath = aePath;
    this.fieldsToAnalyze = fieldsToAnalyze;
    this.fieldsMerging = fieldsMerging;
    this.runtimeParameters = runtimeParameters;
    this.typesFeaturesFieldsMapping = typesFeaturesFieldsMapping;
  }
  public String[] getFieldsToAnalyze() {
    return fieldsToAnalyze;
  }
  public boolean isFieldsMerging() {
    return fieldsMerging;
  }
  public Map<String, Map<String, String>> getTypesFeaturesFieldsMapping() {
    return typesFeaturesFieldsMapping;
  }
  public String getAePath() {
    return aePath;
  }
  public Map<String, String> getRuntimeParameters() {
    return runtimeParameters;
  }
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/SolrUIMAConfigurationReader.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/SolrUIMAConfigurationReader.java
@ -0,0 +1,125 @@
 package org.apache.solr.uima.processor;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.util.HashMap;
 import java.util.Map;
 import org.apache.solr.core.SolrConfig;
 import org.w3c.dom.Node;
 import org.w3c.dom.NodeList;
 /**
 * Read configuration for Solr-UIMA integration
 * 
 * @version $Id$
 * 
 */
 public class SolrUIMAConfigurationReader {
  private static final String AE_RUNTIME_PARAMETERS_NODE_PATH = "/config/uimaConfig/runtimeParameters";
  private static final String FIELD_MAPPING_NODE_PATH = "/config/uimaConfig/fieldMapping";
  private static final String ANALYZE_FIELDS_NODE_PATH = "/config/uimaConfig/analyzeFields";
  private static final String ANALYSIS_ENGINE_NODE_PATH = "/config/uimaConfig/analysisEngine";
  private SolrConfig solrConfig;
  public SolrUIMAConfigurationReader(SolrConfig solrConfig) {
    this.solrConfig = solrConfig;
  }
  public SolrUIMAConfiguration readSolrUIMAConfiguration() {
    return new SolrUIMAConfiguration(readAEPath(), readFieldsToAnalyze(), readFieldsMerging(),
            readTypesFeaturesFieldsMapping(), readAEOverridingParameters());
  }
  private String readAEPath() {
    return solrConfig.getNode(ANALYSIS_ENGINE_NODE_PATH, true).getTextContent();
  }
  private String[] readFieldsToAnalyze() {
    Node analyzeFieldsNode = solrConfig.getNode(ANALYZE_FIELDS_NODE_PATH, true);
    return analyzeFieldsNode.getTextContent().split(",");
  }
  private boolean readFieldsMerging() {
    Node analyzeFieldsNode = solrConfig.getNode(ANALYZE_FIELDS_NODE_PATH, true);
    Node mergeNode = analyzeFieldsNode.getAttributes().getNamedItem("merge");
    return Boolean.valueOf(mergeNode.getNodeValue());
  }
  private Map<String, Map<String, String>> readTypesFeaturesFieldsMapping() {
    Map<String, Map<String, String>> map = new HashMap<String, Map<String, String>>();
    Node fieldMappingNode = solrConfig.getNode(FIELD_MAPPING_NODE_PATH, true);
    /* iterate over UIMA types */
    if (fieldMappingNode.hasChildNodes()) {
      NodeList typeNodes = fieldMappingNode.getChildNodes();
      for (int i = 0; i < typeNodes.getLength(); i++) {
        /* <type> node */
        Node typeNode = typeNodes.item(i);
        if (typeNode.getNodeType() != Node.TEXT_NODE) {
          Node typeNameAttribute = typeNode.getAttributes().getNamedItem("name");
          /* get a UIMA typename */
          String typeName = typeNameAttribute.getNodeValue();
          /* create entry for UIMA type */
          map.put(typeName, new HashMap<String, String>());
          if (typeNode.hasChildNodes()) {
            /* iterate over features */
            NodeList featuresNodeList = typeNode.getChildNodes();
            for (int j = 0; j < featuresNodeList.getLength(); j++) {
              Node mappingNode = featuresNodeList.item(j);
              if (mappingNode.getNodeType() != Node.TEXT_NODE) {
                /* get field name */
                Node fieldNameNode = mappingNode.getAttributes().getNamedItem("field");
                String mappedFieldName = fieldNameNode.getNodeValue();
                /* get feature name */
                Node featureNameNode = mappingNode.getAttributes().getNamedItem("feature");
                String featureName = featureNameNode.getNodeValue();
                /* map the feature to the field for the specified type */
                map.get(typeName).put(featureName, mappedFieldName);
              }
            }
          }
        }
      }
    }
    return map;
  }
  private Map<String, String> readAEOverridingParameters() {
    Map<String, String> runtimeParameters = new HashMap<String, String>();
    Node uimaConfigNode = solrConfig.getNode(AE_RUNTIME_PARAMETERS_NODE_PATH, true);
    if (uimaConfigNode.hasChildNodes()) {
      NodeList overridingNodes = uimaConfigNode.getChildNodes();
      for (int i = 0; i < overridingNodes.getLength(); i++) {
        Node overridingNode = overridingNodes.item(i);
        if (overridingNode.getNodeType() != Node.TEXT_NODE) {
          runtimeParameters.put(overridingNode.getNodeName(), overridingNode.getTextContent());
        }
      }
    }
    return runtimeParameters;
  }
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/UIMAToSolrMapper.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/UIMAToSolrMapper.java
@ -0,0 +1,83 @@
 package org.apache.solr.uima.processor;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.util.Map;
 import org.apache.solr.common.SolrInputDocument;
 import org.apache.uima.cas.FSIterator;
 import org.apache.uima.cas.FeatureStructure;
 import org.apache.uima.cas.Type;
 import org.apache.uima.jcas.JCas;
 import org.apache.uima.jcas.tcas.Annotation;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
 /**
 * Map UIMA types and features over fields of a Solr document
 * 
 * @version $Id$
 */
 public class UIMAToSolrMapper {
  private final Logger log = LoggerFactory.getLogger(UIMAToSolrMapper.class);
  private SolrInputDocument document;
  private JCas cas;
  public UIMAToSolrMapper(SolrInputDocument document, JCas cas) {
    this.document = document;
    this.cas = cas;
  }
  /**
   * map features of a certain UIMA type to corresponding Solr fields based on the mapping
   * 
   * @param typeName
   *          name of UIMA type to map
   * @param featureFieldsmapping
   */
  public void map(String typeName, Map<String, String> featureFieldsmapping) {
    try {
      FeatureStructure fsMock = (FeatureStructure) Class.forName(typeName).getConstructor(
              JCas.class).newInstance(cas);
      Type type = fsMock.getType();
      for (FSIterator<FeatureStructure> iterator = cas.getFSIndexRepository().getAllIndexedFS(type); iterator
              .hasNext();) {
        FeatureStructure fs = iterator.next();
        for (String featureName : featureFieldsmapping.keySet()) {
          String fieldName = featureFieldsmapping.get(featureName);
          log.info(new StringBuffer("mapping ").append(typeName).append("@").append(featureName)
                  .append(" to ").append(fieldName).toString());
          String featureValue = null;
          if (fs instanceof Annotation && "coveredText".equals(featureName)) {
            featureValue = ((Annotation) fs).getCoveredText();
          } else {
            featureValue = fs.getFeatureValueAsString(type.getFeatureByBaseName(featureName));
          }
          log.info(new StringBuffer("writing ").append(featureValue).append(" in ").append(
                  fieldName).toString());
          document.addField(fieldName, featureValue, 1.0f);
        }
      }
    } catch (Exception e) {
      log.error(e.getLocalizedMessage());
    }
  }
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/UIMAUpdateRequestProcessor.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/UIMAUpdateRequestProcessor.java
@ -0,0 +1,126 @@
 package org.apache.solr.uima.processor;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.io.IOException;
 import java.util.Map;
 import org.apache.solr.common.SolrInputDocument;
 import org.apache.solr.core.SolrCore;
 import org.apache.solr.uima.processor.ae.AEProvider;
 import org.apache.solr.uima.processor.ae.AEProviderFactory;
 import org.apache.solr.update.AddUpdateCommand;
 import org.apache.solr.update.processor.UpdateRequestProcessor;
 import org.apache.uima.UIMAException;
 import org.apache.uima.analysis_engine.AnalysisEngine;
 import org.apache.uima.analysis_engine.AnalysisEngineProcessException;
 import org.apache.uima.jcas.JCas;
 import org.apache.uima.resource.ResourceInitializationException;
 /**
 * Update document(s) to be indexed with UIMA extracted information
 * 
 * @version $Id$
 */
 public class UIMAUpdateRequestProcessor extends UpdateRequestProcessor {
  private SolrUIMAConfiguration solrUIMAConfiguration;
  private AEProvider aeProvider;
  public UIMAUpdateRequestProcessor(UpdateRequestProcessor next, SolrCore solrCore) {
    super(next);
    initialize(solrCore);
  }
  private void initialize(SolrCore solrCore) {
    SolrUIMAConfigurationReader uimaConfigurationReader = new SolrUIMAConfigurationReader(solrCore
            .getSolrConfig());
    solrUIMAConfiguration = uimaConfigurationReader.readSolrUIMAConfiguration();
    aeProvider = AEProviderFactory.getInstance().getAEProvider(solrCore.getName(),
            solrUIMAConfiguration.getAePath(), solrUIMAConfiguration.getRuntimeParameters());
  }
  public void processAdd(AddUpdateCommand cmd) throws IOException {
    try {
      /* get Solr document */
      SolrInputDocument solrInputDocument = cmd.getSolrInputDocument();
      /* get the fields to analyze */
      for (String text : getTextsToAnalyze(solrInputDocument)) {
        if (text != null && !"".equals(text)) {
          /* process the text value */
          JCas jcas = processText(text);
          UIMAToSolrMapper uimaToSolrMapper = new UIMAToSolrMapper(solrInputDocument, jcas);
          /* get field mapping from config */
          Map<String, Map<String, String>> typesAndFeaturesFieldsMap = solrUIMAConfiguration
                  .getTypesFeaturesFieldsMapping();
          /* map type features on fields */
          for (String typeFQN : typesAndFeaturesFieldsMap.keySet()) {
            uimaToSolrMapper.map(typeFQN, typesAndFeaturesFieldsMap.get(typeFQN));
          }
        }
      }
    } catch (UIMAException e) {
      throw new RuntimeException(e);
    }
    super.processAdd(cmd);
  }
  /*
   * get the texts to analyze from the corresponding fields
   */
  private String[] getTextsToAnalyze(SolrInputDocument solrInputDocument) {
    String[] fieldsToAnalyze = solrUIMAConfiguration.getFieldsToAnalyze();
    boolean merge = solrUIMAConfiguration.isFieldsMerging();
    String[] textVals = null;
    if (merge) {
      StringBuilder unifiedText = new StringBuilder("");
      for (int i = 0; i < fieldsToAnalyze.length; i++) {
        unifiedText.append(String.valueOf(solrInputDocument.getFieldValue(fieldsToAnalyze[i])));
      }
      textVals = new String[1];
      textVals[0] = unifiedText.toString();
    } else {
      textVals = new String[fieldsToAnalyze.length];
      for (int i = 0; i < fieldsToAnalyze.length; i++) {
        textVals[i] = String.valueOf(solrInputDocument.getFieldValue(fieldsToAnalyze[i]));
      }
    }
    return textVals;
  }
  /* process a field value executing UIMA the CAS containing it as document text */
  private JCas processText(String textFieldValue) throws ResourceInitializationException,
          AnalysisEngineProcessException {
    log.info(new StringBuffer("Analazying text").toString());
    /* get the UIMA analysis engine */
    AnalysisEngine ae = aeProvider.getAE();
    /* create a JCas which contain the text to analyze */
    JCas jcas = ae.newJCas();
    jcas.setDocumentText(textFieldValue);
    /* perform analysis on text field */
    ae.process(jcas);
    log.info(new StringBuilder("Text processing completed").toString());
    return jcas;
  }
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/UIMAUpdateRequestProcessorFactory.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/UIMAUpdateRequestProcessorFactory.java
@ -0,0 +1,37 @@
 package org.apache.solr.uima.processor;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import org.apache.solr.request.SolrQueryRequest;
 import org.apache.solr.response.SolrQueryResponse;
 import org.apache.solr.update.processor.UpdateRequestProcessor;
 import org.apache.solr.update.processor.UpdateRequestProcessorFactory;
 /**
 * Factory for {@link UIMAUpdateRequestProcessor}
 * 
 * @version $Id$
 */
 public class UIMAUpdateRequestProcessorFactory extends UpdateRequestProcessorFactory {
  public UpdateRequestProcessor getInstance(SolrQueryRequest req, SolrQueryResponse rsp,
          UpdateRequestProcessor next) {
    return new UIMAUpdateRequestProcessor(next, req.getCore());
  }
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/ae/AEProvider.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/ae/AEProvider.java
@ -0,0 +1,32 @@
 package org.apache.solr.uima.processor.ae;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import org.apache.uima.analysis_engine.AnalysisEngine;
 import org.apache.uima.resource.ResourceInitializationException;
 /**
 * provide an Apache UIMA {@link AnalysisEngine}
 * 
 * @version $Id$
 */
 public interface AEProvider {
  public AnalysisEngine getAE() throws ResourceInitializationException;
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/ae/AEProviderFactory.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/ae/AEProviderFactory.java
@ -0,0 +1,53 @@
 package org.apache.solr.uima.processor.ae;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.util.HashMap;
 import java.util.Map;
 /**
 * Singleton factory class responsible of {@link AEProvider}s' creation
 * 
 * @version $Id$
 */
 public class AEProviderFactory {
  private static AEProviderFactory instance;
  private Map<String, AEProvider> providerCache = new HashMap<String, AEProvider>();
  private AEProviderFactory() {
    // Singleton
  }
  public static AEProviderFactory getInstance() {
    if (instance == null) {
      instance = new AEProviderFactory();
    }
    return instance;
  }
  public synchronized AEProvider getAEProvider(String core, String aePath,
          Map<String, String> runtimeParameters) {
    String key = new StringBuilder(core).append(aePath).toString();
    if (providerCache.get(key) == null) {
      providerCache.put(key, new OverridingParamsAEProvider(aePath, runtimeParameters));
    }
    return providerCache.get(key);
  }
 }
--- a/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/ae/OverridingParamsAEProvider.java
+++ b/solr/contrib/uima/src/main/java/org/apache/solr/uima/processor/ae/OverridingParamsAEProvider.java
@ -0,0 +1,89 @@
 package org.apache.solr.uima.processor.ae;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.net.URL;
 import java.util.Map;
 import org.apache.uima.UIMAFramework;
 import org.apache.uima.analysis_engine.AnalysisEngine;
 import org.apache.uima.analysis_engine.AnalysisEngineDescription;
 import org.apache.uima.resource.ResourceInitializationException;
 import org.apache.uima.util.XMLInputSource;
 import org.slf4j.Logger;
 import org.slf4j.LoggerFactory;
 /**
 * {@link AEProvider} implementation that creates an Aggregate AE from the given path, also
 * injecting runtime parameters defined in the solrconfig.xml Solr configuration file and assigning
 * them as overriding parameters in the aggregate AE
 * 
 * @version $Id$
 */
 public class OverridingParamsAEProvider implements AEProvider {
  private static Logger log = LoggerFactory.getLogger(OverridingParamsAEProvider.class);
  private String aeFilePath;
  private AnalysisEngine cachedAE;
  private Map<String, String> runtimeParameters;
  public OverridingParamsAEProvider(String aeFilePath, Map<String, String> runtimeParameters) {
    this.aeFilePath = aeFilePath;
    this.runtimeParameters = runtimeParameters;
  }
  public synchronized AnalysisEngine getAE() throws ResourceInitializationException {
    try {
      if (cachedAE == null) {
        // get Resource Specifier from XML file
        URL url = this.getClass().getResource(aeFilePath);
        XMLInputSource in = new XMLInputSource(url);
        // get AE description
        AnalysisEngineDescription desc = UIMAFramework.getXMLParser()
                .parseAnalysisEngineDescription(in);
        /* iterate over each AE (to set runtime parameters) */
        for (String attributeName : runtimeParameters.keySet()) {
          desc.getAnalysisEngineMetaData().getConfigurationParameterSettings().setParameterValue(
                  attributeName, runtimeParameters.get(attributeName));
          log.info(new StringBuilder("setting ").append(attributeName).append(" : ").append(
                  runtimeParameters.get(attributeName)).toString());
        }
        // create AE here
        cachedAE = UIMAFramework.produceAnalysisEngine(desc);
        if (log.isDebugEnabled())
          log.debug(new StringBuilder("AE ").append(cachedAE.getAnalysisEngineMetaData().getName())
                  .append(" created from descriptor ").append(aeFilePath).toString());
      } else {
        cachedAE.reconfigure();
        if (log.isDebugEnabled())
          log.debug(new StringBuilder("AE ").append(cachedAE.getAnalysisEngineMetaData().getName())
                  .append(" at path ").append(aeFilePath).append(" reconfigured ").toString());
      }
    } catch (Exception e) {
      cachedAE = null;
      throw new ResourceInitializationException(e);
    }
    return cachedAE;
  }
 }
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/AggregateSentenceAE.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/AggregateSentenceAE.xml
@ -0,0 +1,41 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>false</primitive>
  <delegateAnalysisEngineSpecifiers>
    <delegateAnalysisEngine key="HmmTagger">
      <import name="HmmTagger"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="WhitespaceTokenizer">
      <import name="WhitespaceTokenizer"/>
    </delegateAnalysisEngine>
  </delegateAnalysisEngineSpecifiers>
  <analysisEngineMetaData>
    <name>AggregateSentenceAE</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters/>
    <configurationParameterSettings/>
    <flowConstraints>
      <fixedFlow>
        <node>WhitespaceTokenizer</node>
        <node>HmmTagger</node>
      </fixedFlow>
    </flowConstraints>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/ExtServicesAE.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/ExtServicesAE.xml
@ -0,0 +1,57 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>false</primitive>
  <delegateAnalysisEngineSpecifiers>
    <delegateAnalysisEngine key="TextConceptTaggingAEDescriptor">
      <import name="TextConceptTaggingAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextKeywordExtractionAEDescriptor">
      <import name="TextKeywordExtractionAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="OpenCalaisAnnotator">
      <import name="OpenCalaisAnnotator"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextCategorizationAEDescriptor">
      <import name="TextCategorizationAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextLanguageDetectionAEDescriptor">
      <import name="TextLanguageDetectionAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextRankedEntityExtractionAEDescriptor">
      <import name="TextRankedEntityExtractionAEDescriptor"/>
    </delegateAnalysisEngine>
  </delegateAnalysisEngineSpecifiers>
  <analysisEngineMetaData>
    <name>ExtServicesAE</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters/>
    <configurationParameterSettings/>
    <flowConstraints>
      <fixedFlow>
        <node>OpenCalaisAnnotator</node>
        <node>TextKeywordExtractionAEDescriptor</node>
        <node>TextLanguageDetectionAEDescriptor</node>
        <node>TextCategorizationAEDescriptor</node>
        <node>TextConceptTaggingAEDescriptor</node>
        <node>TextRankedEntityExtractionAEDescriptor</node>
      </fixedFlow>
    </flowConstraints>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/HmmTagger.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/HmmTagger.xml
@ -0,0 +1,121 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <!--
 	Licensed to the Apache Software Foundation (ASF) under one
 	or more contributor license agreements.  See the NOTICE file
 	distributed with this work for additional information
 	regarding copyright ownership.  The ASF licenses this file
 	to you under the Apache License, Version 2.0 (the
 	"License"); you may not use this file except in compliance
 	with the License.  You may obtain a copy of the License at
 	http://www.apache.org/licenses/LICENSE-2.0
 	Unless required by applicable law or agreed to in writing,
 	software distributed under the License is distributed on an
 	"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 	KIND, either express or implied.  See the License for the
 	specific language governing permissions and limitations
 	under the License.    
 -->
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.examples.tagger.HMMTagger</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>Hidden Markov Model - Part of Speech Tagger</name>
    <description>A configuration of the HmmTaggerAnnotator that looks for
 			parts of speech of identified tokens within existing
 			Sentence and Token annotations. See also
 			WhitespaceTokenizer.xml.</description>
    <version>1.0</version>
    <vendor>The Apache Software Foundation</vendor>
    <configurationParameters>
      <configurationParameter>
        <name>NGRAM_SIZE</name>
        <type>Integer</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>NGRAM_SIZE</name>
        <value>
          <integer>3</integer>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <types>
        <typeDescription>
          <name>org.apache.uima.TokenAnnotation</name>
          <description>Single token annotation</description>
          <supertypeName>uima.tcas.Annotation</supertypeName>
          <features>
            <featureDescription>
              <name>posTag</name>
              <description>contains part-of-speech of a
 								corresponding token</description>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
          </features>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.SentenceAnnotation</name>
          <description>sentence annotation</description>
          <supertypeName>uima.tcas.Annotation</supertypeName>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs>
          <type>org.apache.uima.TokenAnnotation</type>
          <type allAnnotatorFeatures="true">org.apache.uima.SentenceAnnotation</type>
          <feature>org.apache.uima.TokenAnnotation:end</feature>
          <feature>org.apache.uima.TokenAnnotation:begin</feature>
        </inputs>
        <outputs>
          <type>org.apache.uima.TokenAnnotation</type>
          <feature>org.apache.uima.TokenAnnotation:posTag</feature>
          <feature>org.apache.uima.TokenAnnotation:end</feature>
          <feature>org.apache.uima.TokenAnnotation:begin</feature>
        </outputs>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <externalResourceDependencies>
    <externalResourceDependency>
      <key>Model</key>
      <description>HMM Tagger model file</description>
      <interfaceName>org.apache.uima.examples.tagger.IModelResource</interfaceName>
      <optional>false</optional>
    </externalResourceDependency>
  </externalResourceDependencies>
  <resourceManagerConfiguration>
    <externalResources>
      <externalResource>
        <name>ModelFile</name>
        <description>HMM Tagger model file</description>
        <fileResourceSpecifier>
          <fileUrl>file:english/BrownModel.dat</fileUrl>
        </fileResourceSpecifier>
        <implementationName>org.apache.uima.examples.tagger.ModelResource</implementationName>
      </externalResource>
    </externalResources>
    <externalResourceBindings>
      <externalResourceBinding>
        <key>Model</key>
        <resourceName>ModelFile</resourceName>
      </externalResourceBinding>
    </externalResourceBindings>
  </resourceManagerConfiguration>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/OpenCalaisAnnotator.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/OpenCalaisAnnotator.xml
@ -0,0 +1,194 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.annotator.calais.OpenCalaisAnnotator</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>OpenCalaisAnnotator</name>
    <description/>
    <configurationParameters>
      <configurationParameter>
        <name>allowDistribution</name>
        <description/>
        <type>Boolean</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>allowSearch</name>
        <description/>
        <type>Boolean</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>submitter</name>
        <description/>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>licenseID</name>
        <description/>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>allowDistribution</name>
        <value>
          <boolean>false</boolean>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>allowSearch</name>
        <value>
          <boolean>false</boolean>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>submitter</name>
        <value>
          <string/>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>licenseID</name>
        <value>
          <string>OC_LICENSE_ID</string>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <types>
        <typeDescription>
          <name>org.apache.uima.calais.Person</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Anniversary</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.City</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Company</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Continent</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Country</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Currency</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.EmailAddress</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Facility</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.FaxNumber</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Holiday</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.IndustryTerm</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.NaturalDisaster</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.NaturalFeature</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Organization</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.PhoneNumber</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.ProviceOrState</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Region</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.Technology</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.URL</name>
          <description/>
          <supertypeName>org.apache.uima.calais.BaseType</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.calais.BaseType</name>
          <description/>
          <supertypeName>uima.tcas.Annotation</supertypeName>
          <features>
            <featureDescription>
              <name>calaisType</name>
              <description>OpenCalais type</description>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
          </features>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/OverridingParamsExtServicesAE.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/OverridingParamsExtServicesAE.xml
@ -0,0 +1,147 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>false</primitive>
  <delegateAnalysisEngineSpecifiers>
    <delegateAnalysisEngine key="TextKeywordExtractionAEDescriptor">
      <import name="TextKeywordExtractionAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextConceptTaggingAEDescriptor">
      <import name="TextConceptTaggingAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="OpenCalaisAnnotator">
      <import name="OpenCalaisAnnotator"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextLanguageDetectionAEDescriptor">
      <import name="TextLanguageDetectionAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextCategorizationAEDescriptor">
      <import name="TextCategorizationAEDescriptor"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="AggregateSentenceAE">
      <import location="AggregateSentenceAE.xml"/>
    </delegateAnalysisEngine>
    <delegateAnalysisEngine key="TextRankedEntityExtractionAEDescriptor">
      <import name="TextRankedEntityExtractionAEDescriptor"/>
    </delegateAnalysisEngine>
  </delegateAnalysisEngineSpecifiers>
  <analysisEngineMetaData>
    <name>ExtServicesAE</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters searchStrategy="language_fallback">
      <configurationParameter>
        <name>oc_licenseID</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
        <overrides>
          <parameter>OpenCalaisAnnotator/licenseID</parameter>
        </overrides>
      </configurationParameter>
      <configurationParameter>
        <name>keyword_apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
        <overrides>
          <parameter>TextKeywordExtractionAEDescriptor/apikey</parameter>
        </overrides>
      </configurationParameter>
      <configurationParameter>
        <name>concept_apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
        <overrides>
          <parameter>TextConceptTaggingAEDescriptor/apikey</parameter>
        </overrides>
      </configurationParameter>
      <configurationParameter>
        <name>lang_apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
        <overrides>
          <parameter>TextLanguageDetectionAEDescriptor/apikey</parameter>
        </overrides>
      </configurationParameter>
      <configurationParameter>
        <name>cat_apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
        <overrides>
          <parameter>TextCategorizationAEDescriptor/apikey</parameter>
        </overrides>
      </configurationParameter>
      <configurationParameter>
        <name>entities_apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
        <overrides>
          <parameter>TextRankedEntityExtractionAEDescriptor/apikey</parameter>
        </overrides>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>oc_licenseID</name>
        <value>
          <string>licenseid</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>keyword_apikey</name>
        <value>
          <string>apikey</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>concept_apikey</name>
        <value>
          <string>apikey</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>lang_apikey</name>
        <value>
          <string>apikey</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>cat_apikey</name>
        <value>
          <string>apikey</string>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <flowConstraints>
      <fixedFlow>
        <node>AggregateSentenceAE</node>
        <node>OpenCalaisAnnotator</node>
        <node>TextKeywordExtractionAEDescriptor</node>
        <node>TextLanguageDetectionAEDescriptor</node>
        <node>TextCategorizationAEDescriptor</node>
        <node>TextConceptTaggingAEDescriptor</node>
        <node>TextRankedEntityExtractionAEDescriptor</node>
      </fixedFlow>
    </flowConstraints>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextCategorizationAEDescriptor.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextCategorizationAEDescriptor.xml
@ -0,0 +1,102 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <!--
    	Licensed to the Apache Software Foundation (ASF) under one
    	or more contributor license agreements.  See the NOTICE file
    	distributed with this work for additional information
    	regarding copyright ownership.  The ASF licenses this file
    	to you under the Apache License, Version 2.0 (the
    	"License"); you may not use this file except in compliance
    	with the License.  You may obtain a copy of the License at
    	http://www.apache.org/licenses/LICENSE-2.0
    	Unless required by applicable law or agreed to in writing,
    	software distributed under the License is distributed on an
    	"AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
    	KIND, either express or implied.  See the License for the
    	specific language governing permissions and limitations
    	under the License.
 -->
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.alchemy.annotator.TextCategorizationAnnotator</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>TextCategorizationAEDescriptor</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters>
      <configurationParameter>
        <name>apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>outputMode</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>baseUrl</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>outputMode</name>
        <value>
          <string>xml</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>apikey</name>
        <value>
          <string>AA_API_KEY</string>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <types>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.categorization.Category</name>
          <description/>
          <supertypeName>uima.cas.TOP</supertypeName>
          <features>
            <featureDescription>
              <name>score</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>text</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
          </features>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextConceptTaggingAEDescriptor.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextConceptTaggingAEDescriptor.xml
@ -0,0 +1,196 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <!--
   Licensed to the Apache Software Foundation (ASF) under one
   or more contributor license agreements.  See the NOTICE file
   distributed with this work for additional information
   regarding copyright ownership.  The ASF licenses this file
   to you under the Apache License, Version 2.0 (the
   "License"); you may not use this file except in compliance
   with the License.  You may obtain a copy of the License at
     http://www.apache.org/licenses/LICENSE-2.0
   Unless required by applicable law or agreed to in writing,
   software distributed under the License is distributed on an
   "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
   KIND, either express or implied.  See the License for the
   specific language governing permissions and limitations
   under the License.    
 -->
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.alchemy.annotator.TextConceptTaggingAnnotator</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>TextConceptTaggingAEDescriptor</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters>
      <configurationParameter>
        <name>apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>outputMode</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>linkedData</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>showSourceText</name>
        <type>Integer</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>maxRetrieve</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>url</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>apikey</name>
        <value>
          <string/>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>outputMode</name>
        <value>
          <string>xml</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>linkedData</name>
        <value>
          <string>1</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>showSourceText</name>
        <value>
          <integer>0</integer>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>maxRetrieve</name>
        <value>
          <string>8</string>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <types>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.concept.ConceptFS</name>
          <description>a concept tag</description>
          <supertypeName>uima.cas.TOP</supertypeName>
          <features>
            <featureDescription>
              <name>text</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>relevance</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>website</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>geo</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>dbpedia</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>yago</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>opencyc</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>freebase</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>ciaFactbook</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>census</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>geonames</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>musicBrainz</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>crunchbase</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>semanticCrunchbase</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
          </features>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextKeywordExtractionAEDescriptor.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextKeywordExtractionAEDescriptor.xml
@ -0,0 +1,107 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.alchemy.annotator.TextKeywordExtractionAnnotator</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>TextKeywordExtractionAEDescriptor</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters>
      <configurationParameter>
        <name>apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>outputMode</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>baseUrl</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>url</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>maxRetrieve</name>
        <type>Integer</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>showSourceText</name>
        <type>Integer</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>outputMode</name>
        <value>
          <string>xml</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>apikey</name>
        <value>
          <string>04490000a72fe7ec5cb3497f14e77f338c86f2fe</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>maxRetrieve</name>
        <value>
          <integer>10</integer>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>showSourceText</name>
        <value>
          <integer>0</integer>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <types>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.keywords.KeywordFS</name>
          <description/>
          <supertypeName>uima.cas.TOP</supertypeName>
          <features>
            <featureDescription>
              <name>text</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
          </features>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextLanguageDetectionAEDescriptor.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextLanguageDetectionAEDescriptor.xml
@ -0,0 +1,107 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.alchemy.annotator.TextLanguageDetectionAnnotator</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>TextLanguageDetectionAEDescriptor</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters>
      <configurationParameter>
        <name>apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>outputMode</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>url</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>outputMode</name>
        <value>
          <string>xml</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>apikey</name>
        <value>
          <string>AA_API_KEY</string>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <types>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.language.LanguageFS</name>
          <description/>
          <supertypeName>uima.cas.TOP</supertypeName>
          <features>
            <featureDescription>
              <name>language</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>iso6391</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>iso6392</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>iso6393</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>ethnologue</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>nativeSpeakers</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>wikipedia</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
          </features>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextRankedEntityExtractionAEDescriptor.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/TextRankedEntityExtractionAEDescriptor.xml
@ -0,0 +1,403 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <!--
      Licensed to the Apache Software Foundation (ASF) under one
      or more contributor license agreements.  See the NOTICE file
      distributed with this work for additional information
      regarding copyright ownership.  The ASF licenses this file
      to you under the Apache License, Version 2.0 (the
      "License"); you may not use this file except in compliance
      with the License.  You may obtain a copy of the License at
      http://www.apache.org/licenses/LICENSE-2.0
      Unless required by applicable law or agreed to in writing,
      software distributed under the License is distributed on an
      "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
      KIND, either express or implied.  See the License for the
      specific language governing permissions and limitations
      under the License.
 -->
 <analysisEngineDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <frameworkImplementation>org.apache.uima.java</frameworkImplementation>
  <primitive>true</primitive>
  <annotatorImplementationName>org.apache.uima.alchemy.annotator.TextRankedNamedEntityExtractionAnnotator</annotatorImplementationName>
  <analysisEngineMetaData>
    <name>TextRankedEntityExtractionAEDescriptor</name>
    <description/>
    <version>1.0</version>
    <vendor/>
    <configurationParameters>
      <configurationParameter>
        <name>apikey</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>outputMode</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>disambiguate</name>
        <type>Integer</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>linkedData</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>showSourceText</name>
        <type>Integer</type>
        <multiValued>false</multiValued>
        <mandatory>true</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>baseUrl</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>url</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>coreference</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
      <configurationParameter>
        <name>quotations</name>
        <type>String</type>
        <multiValued>false</multiValued>
        <mandatory>false</mandatory>
      </configurationParameter>
    </configurationParameters>
    <configurationParameterSettings>
      <nameValuePair>
        <name>apikey</name>
        <value>
          <string/>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>outputMode</name>
        <value>
          <string>xml</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>disambiguate</name>
        <value>
          <integer>1</integer>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>linkedData</name>
        <value>
          <string>1</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>coreference</name>
        <value>
          <string>1</string>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>showSourceText</name>
        <value>
          <integer>0</integer>
        </value>
      </nameValuePair>
      <nameValuePair>
        <name>quotations</name>
        <value>
          <string>1</string>
        </value>
      </nameValuePair>
    </configurationParameterSettings>
    <typeSystemDescription>
      <imports>
        <import location="baseAlchemyTypeSystemDescriptor.xml"/>
      </imports>
      <types>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Anniversary</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Automobile</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.City</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Company</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Continent</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Country</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.EntertainmentAward</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Facility</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.FieldTerminology</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.FinancialMarketIndex</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.GeographicFeature</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.HealthCondition</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Holiday</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Movie</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.MusicGroup</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.NaturalDisaster</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Organization</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Person</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.PrintMedia</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.RadioProgram</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.RadioStation</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Region</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Sport</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.StateOrCounty</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Technology</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.TelevisionShow</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.TelevisionStation</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.OperatingSystem</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.SportingEvent</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.Drug</name>
          <description/>
          <supertypeName>org.apache.uima.alchemy.ts.entity.BaseEntity</supertypeName>
        </typeDescription>
        <typeDescription>
          <name>org.apache.uima.alchemy.ts.entity.BaseEntity</name>
          <description/>
          <supertypeName>uima.cas.TOP</supertypeName>
          <features>
            <featureDescription>
              <name>text</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>count</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>relevance</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>disambiguation</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>subType</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>website</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>geo</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>dbpedia</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>yago</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>opencyc</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>umbel</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>freebase</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>ciaFactbook</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>census</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>geonames</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>musicBrainz</name>
              <description/>
              <rangeTypeName>uima.cas.String</rangeTypeName>
            </featureDescription>
            <featureDescription>
              <name>quotations</name>
              <description/>
              <rangeTypeName>uima.cas.StringArray</rangeTypeName>
              <multipleReferencesAllowed>true</multipleReferencesAllowed>
            </featureDescription>
            <featureDescription>
              <name>occurrences</name>
              <description>A list of annotations annotating this entity</description>
              <rangeTypeName>uima.cas.FSList</rangeTypeName>
              <elementType>uima.tcas.Annotation</elementType>
            </featureDescription>
          </features>
        </typeDescription>
      </types>
    </typeSystemDescription>
    <typePriorities/>
    <fsIndexCollection/>
    <capabilities>
      <capability>
        <inputs/>
        <outputs/>
        <languagesSupported/>
      </capability>
    </capabilities>
    <operationalProperties>
      <modifiesCas>true</modifiesCas>
      <multipleDeploymentAllowed>true</multipleDeploymentAllowed>
      <outputsNewCASes>false</outputsNewCASes>
    </operationalProperties>
  </analysisEngineMetaData>
  <resourceManagerConfiguration/>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/WhitespaceTokenizer.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/WhitespaceTokenizer.xml
@ -0,0 +1,115 @@
 <?xml version="1.0" encoding="UTF-8" ?>
 <!--
 	***************************************************************
 	* Licensed to the Apache Software Foundation (ASF) under one
 	* or more contributor license agreements.  See the NOTICE file
 	* distributed with this work for additional information
 	* regarding copyright ownership.  The ASF licenses this file
 	* to you under the Apache License, Version 2.0 (the
 	* "License"); you may not use this file except in compliance
 	* with the License.  You may obtain a copy of the License at
 	*
 	*   http://www.apache.org/licenses/LICENSE-2.0
 	* 
 	* Unless required by applicable law or agreed to in writing,
 	* software distributed under the License is distributed on an
 	* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 	* KIND, either express or implied.  See the License for the
 	* specific language governing permissions and limitations
 	* under the License.
 	***************************************************************
 -->
 <analysisEngineDescription
 	xmlns="http://uima.apache.org/resourceSpecifier">
 	<frameworkImplementation>
 		org.apache.uima.java
 	</frameworkImplementation>
 	<primitive>true</primitive>
 	<annotatorImplementationName>
 		org.apache.uima.annotator.WhitespaceTokenizer
 	</annotatorImplementationName>
 	<analysisEngineMetaData>
 		<name>WhitespaceTokenizer</name>
 		<description>
 			creates token and sentence annotations for whitespace
 			separated languages
 		</description>
 		<version>1.0</version>
 		<vendor>The Apache Software Foundation</vendor>
 		<configurationParameters>
 			<configurationParameter>
 				<name>SofaNames</name>
 				<description>
 					The Sofa names the annotator should work on. If no
 					names are specified, the annotator works on the
 					default sofa.
 				</description>
 				<type>String</type>
 				<multiValued>true</multiValued>
 				<mandatory>false</mandatory>
 			</configurationParameter>
 		</configurationParameters>
 		<configurationParameterSettings>
 		<!-- 
 			<nameValuePair>
 				<name>SofaNames</name>
 				<value>
 					<array>
 						<string>sofaName</string>
 					</array>
 				</value>
 			</nameValuePair>
 		-->
 		</configurationParameterSettings>
 		<typeSystemDescription>
 			<typeDescription>
 				<name>org.apache.uima.TokenAnnotation</name>
 				<description>Single token annotation</description>
 				<supertypeName>uima.tcas.Annotation</supertypeName>
 				<features>
 					<featureDescription>
 						<name>tokenType</name>
 						<description>token type</description>
 						<rangeTypeName>uima.cas.String</rangeTypeName>
 					</featureDescription>
 				</features>
 			</typeDescription>
 			<typeDescription>
 				<name>org.apache.uima.SentenceAnnotation</name>
 				<description>sentence annotation</description>
 				<supertypeName>uima.tcas.Annotation</supertypeName>
 				<features>
 				</features>
 			</typeDescription>
 		</typeSystemDescription>
 		<fsIndexes />
 		<capabilities>
 			<capability>
 				<inputs />
 				<outputs>
 					<type>org.apache.uima.TokenAnnotation</type>
 					<feature>
 						org.apache.uima.TokenAnnotation:tokentype
 					</feature>
 					<type>org.apache.uima.SentenceAnnotation</type>
 				</outputs>
 				<languagesSupported>
 					<language>x-unspecified</language>
 				</languagesSupported>
 			</capability>
 		</capabilities>
 	</analysisEngineMetaData>
 </analysisEngineDescription>
--- a/solr/contrib/uima/src/main/resources/org/apache/uima/desc/baseAlchemyTypeSystemDescriptor.xml
+++ b/solr/contrib/uima/src/main/resources/org/apache/uima/desc/baseAlchemyTypeSystemDescriptor.xml
@ -0,0 +1,41 @@
 <?xml version="1.0" encoding="UTF-8"?>
 <!--
      Licensed to the Apache Software Foundation (ASF) under one
      or more contributor license agreements.  See the NOTICE file
      distributed with this work for additional information
      regarding copyright ownership.  The ASF licenses this file
      to you under the Apache License, Version 2.0 (the
      "License"); you may not use this file except in compliance
      with the License.  You may obtain a copy of the License at
      http://www.apache.org/licenses/LICENSE-2.0
      Unless required by applicable law or agreed to in writing,
      software distributed under the License is distributed on an
      "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
      KIND, either express or implied.  See the License for the
      specific language governing permissions and limitations
      under the License.
 -->
 <typeSystemDescription xmlns="http://uima.apache.org/resourceSpecifier">
  <name>baseAlchemyTypeSystemDescriptor</name>
  <description/>
  <version>1.0</version>
  <vendor/>
  <types>
    <typeDescription>
      <name>org.apache.uima.alchemy.ts.entity.AlchemyAnnotation</name>
      <description/>
      <supertypeName>uima.tcas.Annotation</supertypeName>
      <features>
        <featureDescription>
          <name>alchemyType</name>
          <description>alchemyAPI type</description>
          <rangeTypeName>uima.cas.String</rangeTypeName>
        </featureDescription>
      </features>
    </typeDescription>
  </types>
 </typeSystemDescription>
--- a/solr/contrib/uima/src/main/resources/solr/conf/aggregate-uima-config.xml
+++ b/solr/contrib/uima/src/main/resources/solr/conf/aggregate-uima-config.xml
@ -0,0 +1,33 @@
 <?xml version="1.0" encoding="UTF-8" ?>
  <!--
    Licensed to the Apache Software Foundation (ASF) under one or more
    contributor license agreements. See the NOTICE file distributed with
    this work for additional information regarding copyright ownership.
    The ASF licenses this file to You under the Apache License, Version
    2.0 (the "License"); you may not use this file except in compliance
    with the License. You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0 Unless required by
    applicable law or agreed to in writing, software distributed under
    the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES
    OR CONDITIONS OF ANY KIND, either express or implied. See the
    License for the specific language governing permissions and
    limitations under the License.
  -->
 <uimaConfig>
  <runtimeParameters>
    <keyword_apikey>VALID_ALCHEMYAPI_KEY</keyword_apikey>
    <concept_apikey>VALID_ALCHEMYAPI_KEY</concept_apikey>
    <lang_apikey>VALID_ALCHEMYAPI_KEY</lang_apikey>
    <cat_apikey>VALID_ALCHEMYAPI_KEY</cat_apikey>
    <oc_licenseID>VALID_OPENCALAIS_KEY</oc_licenseID>
  </runtimeParameters>
  <analysisEngine>/org/apache/uima/desc/OverridingParamsExtServicesAE.xml</analysisEngine>
  <analyzeFields merge="false">text,title</analyzeFields>
  <fieldMapping>
    <type name="org.apache.uima.jcas.tcas.Annotation">
      <map feature="coveredText" field="tag"/>
    </type>
  </fieldMapping>
 </uimaConfig>
--- a/solr/contrib/uima/src/main/resources/solr/conf/uima-fields.xml
+++ b/solr/contrib/uima/src/main/resources/solr/conf/uima-fields.xml
@ -0,0 +1,9 @@
 <?xml version="1.0" encoding="UTF-8" ?>
 <fields>
  <field name="language" type="string" indexed="true" stored="true" required="false"/>
  <field name="concept" type="string" indexed="true" stored="true" multiValued="true" required="false"/>
  <field name="keyword" type="string" indexed="true" stored="true" multiValued="true" required="false"/>
  <field name="suggested_category" type="string" indexed="true" stored="true" multiValued="false" required="false"/>
  <field name="sentence" type="text" indexed="true" stored="true" multiValued="true" required="false" />
  <dynamicField name="entity*" type="text" indexed="true" stored="true" multiValued="true"/>
 </fields>
--- a/solr/contrib/uima/src/test/java/org/apache/solr/uima/processor/UIMAUpdateRequestProcessorTest.java
+++ b/solr/contrib/uima/src/test/java/org/apache/solr/uima/processor/UIMAUpdateRequestProcessorTest.java
@ -0,0 +1,137 @@
 package org.apache.solr.uima.processor;
 /**
 * Licensed to the Apache Software Foundation (ASF) under one or more
 * contributor license agreements.  See the NOTICE file distributed with
 * this work for additional information regarding copyright ownership.
 * The ASF licenses this file to You under the Apache License, Version 2.0
 * (the "License"); you may not use this file except in compliance with
 * the License.  You may obtain a copy of the License at
 *
 *     http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
 import java.net.URL;
 import java.net.URLConnection;
 import java.util.ArrayList;
 import java.util.HashMap;
 import java.util.Map;
 import org.apache.solr.SolrTestCaseJ4;
 import org.apache.solr.common.params.MultiMapSolrParams;
 import org.apache.solr.common.params.SolrParams;
 import org.apache.solr.common.params.UpdateParams;
 import org.apache.solr.common.util.ContentStream;
 import org.apache.solr.common.util.ContentStreamBase;
 import org.apache.solr.core.SolrCore;
 import org.apache.solr.handler.XmlUpdateRequestHandler;
 import org.apache.solr.request.SolrQueryRequestBase;
 import org.apache.solr.response.SolrQueryResponse;
 import org.apache.solr.update.processor.UpdateRequestProcessorChain;
 import org.junit.Before;
 import org.junit.BeforeClass;
 import org.junit.Test;
 /**
 * TestCase for {@link UIMAUpdateRequestProcessor}
 * 
 * @version $Id$
 */
 public class UIMAUpdateRequestProcessorTest extends SolrTestCaseJ4 {
  @BeforeClass
  public static void beforeClass() throws Exception {
    initCore("solrconfig.xml", "schema.xml", "solr-uima");
  }
  @Before
  public void setUp() throws Exception {
    super.setUp();
    clearIndex();
    assertU(commit());
  }
  @Test
  public void testProcessorConfiguration() {
    SolrCore core = h.getCore();
    UpdateRequestProcessorChain chained = core.getUpdateProcessingChain("uima");
    assertNotNull(chained);
    UIMAUpdateRequestProcessorFactory factory = (UIMAUpdateRequestProcessorFactory) chained
            .getFactories()[0];
    assertNotNull(factory);
  }
  @Test
  public void testProcessing() throws Exception {
    // this test requires an internet connection (e.g. opencalais api)
    checkInternetConnection();
    addDoc(adoc(
            "id",
            "2312312321312",
            "text",
            "SpellCheckComponent got improvement related to recent Lucene changes. \n  "
                    + "Add support for specifying Spelling SuggestWord Comparator to Lucene spell "
                    + "checkers for SpellCheckComponent. Issue SOLR-2053 is already fixed, patch is"
                    + " attached if you need it, but it is also committed to trunk and 3_x branch."
                    + " Last Lucene European Conference has been held in Prague."));
    assertU(commit());
    assertQ(req("language:english"), "//*[@numFound='1']");
  }
  @Test
  public void testTwoUpdates() {
    // this test requires an internet connection (e.g. opencalais api)
    checkInternetConnection();
    try {
      addDoc(adoc("id", "1", "text", "The Apache Software Foundation is happy to announce "
              + "BarCampApache Sydney, Australia, the first ASF-backed event in the Southern "
              + "Hemisphere!"));
      assertU(commit());
      assertQ(req("language:english"), "//*[@numFound='1']");
      addDoc(adoc("id", "2", "text", "Taking place 11th December 2010 at the University "
              + "of Sydney's Darlington Centre, the BarCampApache \"unconference\" will be"
              + " attendee-driven, facilitated by members of the Apache community and will "
              + "focus on the Apache..."));
      assertU(commit());
      assertQ(req("language:english"), "//*[@numFound='2']");
    } catch (Exception e) {
      assumeNoException("Multiple updates on same instance didn't work", e);
    }
  }
  private void addDoc(String doc) throws Exception {
    Map<String, String[]> params = new HashMap<String, String[]>();
    params.put(UpdateParams.UPDATE_PROCESSOR, new String[] { "uima" });
    MultiMapSolrParams mmparams = new MultiMapSolrParams(params);
    SolrQueryRequestBase req = new SolrQueryRequestBase(h.getCore(), (SolrParams) mmparams) {
    };
    XmlUpdateRequestHandler handler = new XmlUpdateRequestHandler();
    handler.init(null);
    ArrayList<ContentStream> streams = new ArrayList<ContentStream>(2);
    streams.add(new ContentStreamBase.StringStream(doc));
    req.setContentStreams(streams);
    handler.handleRequestBody(req, new SolrQueryResponse());
  }
  private void checkInternetConnection() {
    try {
      URLConnection conn = new URL("http://www.apache.org/").openConnection();
      conn.setConnectTimeout(5000);
      conn.setReadTimeout(5000);
      conn.connect();
    } catch (Exception ex) {
      assumeNoException("This test requires an internet connection", ex);
    }
  }
 }
--- a/solr/contrib/uima/src/test/resources/solr-uima/conf/protwords.txt
+++ b/solr/contrib/uima/src/test/resources/solr-uima/conf/protwords.txt
@ -0,0 +1,21 @@
 # The ASF licenses this file to You under the Apache License, Version 2.0
 # (the "License"); you may not use this file except in compliance with
 # the License.  You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #-----------------------------------------------------------------------
 # Use a protected word file to protect against the stemmer reducing two
 # unrelated words to the same base word.
 # Some non-words that normally won't be encountered,
 # just to test that they won't be stemmed.
 dontstems
 zwhacky
--- a/solr/contrib/uima/src/test/resources/solr-uima/conf/schema.xml
+++ b/solr/contrib/uima/src/test/resources/solr-uima/conf/schema.xml
@ -0,0 +1,679 @@
 <?xml version="1.0" encoding="UTF-8" ?>
  <!--
    Licensed to the Apache Software Foundation (ASF) under one or more
    contributor license agreements. See the NOTICE file distributed with
    this work for additional information regarding copyright ownership.
    The ASF licenses this file to You under the Apache License, Version
    2.0 (the "License"); you may not use this file except in compliance
    with the License. You may obtain a copy of the License at
    http://www.apache.org/licenses/LICENSE-2.0 Unless required by
    applicable law or agreed to in writing, software distributed under
    the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES
    OR CONDITIONS OF ANY KIND, either express or implied. See the
    License for the specific language governing permissions and
    limitations under the License.
  -->
  <!--
    This is the Solr schema file. This file should be named "schema.xml"
    and should be in the conf directory under the solr home (i.e.
    ./solr/conf/schema.xml by default) or located where the classloader
    for the Solr webapp can find it. This example schema is the
    recommended starting point for users. It should be kept correct and
    concise, usable out-of-the-box. For more information, on how to
    customize this file, please see
    http://wiki.apache.org/solr/SchemaXml PERFORMANCE NOTE: this schema
    includes many optional features and should not be used for
    benchmarking. To improve performance one could - set stored="false"
    for all fields possible (esp large fields) when you only need to
    search on the field but don't need to return the original value. -
    set indexed="false" if you don't need to search on the field, but
    only return the field as a result of searching on other indexed
    fields. - remove all unneeded copyField statements - for best index
    size and searching performance, set "index" to false for all general
    text fields, use copyField to copy them to the catchall "text"
    field, and use that for searching. - For maximum indexing
    performance, use the StreamingUpdateSolrServer java client. -
    Remember to run the JVM in server mode, and use a higher logging
    level that avoids logging every request
  -->
 <schema name="sample" version="1.2">
  <!--
    attribute "name" is the name of this schema and is only used for
    display purposes. Applications should change this to reflect the
    nature of the search collection. version="1.2" is Solr's version
    number for the schema syntax and semantics. It should not normally
    be changed by applications. 1.0: multiValued attribute did not
    exist, all fields are multiValued by nature 1.1: multiValued
    attribute introduced, false by default 1.2: omitTermFreqAndPositions
    attribute introduced, true by default except for text fields.
  -->
  <types>
    <!--
      field type definitions. The "name" attribute is just a label to be
      used by field definitions. The "class" attribute and any other
      attributes determine the real behavior of the fieldType. Class
      names starting with "solr" refer to java classes in the
      org.apache.solr.analysis package.
    -->
    <!--
      The StrField type is not analyzed, but indexed/stored verbatim. -
      StrField and TextField support an optional compressThreshold which
      limits compression (if enabled in the derived fields) to values
      which exceed a certain size (in characters).
    -->
    <fieldType name="string" class="solr.StrField"
      sortMissingLast="true" omitNorms="true" />
    <!-- boolean type: "true" or "false" -->
    <fieldType name="boolean" class="solr.BoolField"
      sortMissingLast="true" omitNorms="true" />
    <!--
      Binary data type. The data should be sent/retrieved in as Base64
      encoded Strings
    -->
    <fieldtype name="binary" class="solr.BinaryField" />
    <!--
      The optional sortMissingLast and sortMissingFirst attributes are
      currently supported on types that are sorted internally as
      strings. This includes
      "string","boolean","sint","slong","sfloat","sdouble","pdate" - If
      sortMissingLast="true", then a sort on this field will cause
      documents without the field to come after documents with the
      field, regardless of the requested sort order (asc or desc). - If
      sortMissingFirst="true", then a sort on this field will cause
      documents without the field to come before documents with the
      field, regardless of the requested sort order. - If
      sortMissingLast="false" and sortMissingFirst="false" (the
      default), then default lucene sorting will be used which places
      docs without the field first in an ascending sort and last in a
      descending sort.
    -->
    <!--
      Default numeric field types. For faster range queries, consider
      the tint/tfloat/tlong/tdouble types.
    -->
    <fieldType name="int" class="solr.TrieIntField"
      precisionStep="0" omitNorms="true" positionIncrementGap="0" />
    <fieldType name="float" class="solr.TrieFloatField"
      precisionStep="0" omitNorms="true" positionIncrementGap="0" />
    <fieldType name="long" class="solr.TrieLongField"
      precisionStep="0" omitNorms="true" positionIncrementGap="0" />
    <fieldType name="double" class="solr.TrieDoubleField"
      precisionStep="0" omitNorms="true" positionIncrementGap="0" />
    <!--
      Numeric field types that index each value at various levels of
      precision to accelerate range queries when the number of values
      between the range endpoints is large. See the javadoc for
      NumericRangeQuery for internal implementation details. Smaller
      precisionStep values (specified in bits) will lead to more tokens
      indexed per value, slightly larger index size, and faster range
      queries. A precisionStep of 0 disables indexing at different
      precision levels.
    -->
    <fieldType name="tint" class="solr.TrieIntField"
      precisionStep="8" omitNorms="true" positionIncrementGap="0" />
    <fieldType name="tfloat" class="solr.TrieFloatField"
      precisionStep="8" omitNorms="true" positionIncrementGap="0" />
    <fieldType name="tlong" class="solr.TrieLongField"
      precisionStep="8" omitNorms="true" positionIncrementGap="0" />
    <fieldType name="tdouble" class="solr.TrieDoubleField"
      precisionStep="8" omitNorms="true" positionIncrementGap="0" />
    <!--
      The format for this date field is of the form
      1995-12-31T23:59:59Z, and is a more restricted form of the
      canonical representation of dateTime
      http://www.w3.org/TR/xmlschema-2/#dateTime The trailing "Z"
      designates UTC time and is mandatory. Optional fractional seconds
      are allowed: 1995-12-31T23:59:59.999Z All other components are
      mandatory. Expressions can also be used to denote calculations
      that should be performed relative to "NOW" to determine the value,
      ie... NOW/HOUR ... Round to the start of the current hour NOW-1DAY
      ... Exactly 1 day prior to now NOW/DAY+6MONTHS+3DAYS ... 6 months
      and 3 days in the future from the start of the current day Consult
      the DateField javadocs for more information. Note: For faster
      range queries, consider the tdate type
    -->
    <fieldType name="date" class="solr.TrieDateField"
      omitNorms="true" precisionStep="0" positionIncrementGap="0" />
    <!--
      A Trie based date field for faster date range queries and date
      faceting.
    -->
    <fieldType name="tdate" class="solr.TrieDateField"
      omitNorms="true" precisionStep="6" positionIncrementGap="0" />
    <!--
      Note: These should only be used for compatibility with existing
      indexes (created with older Solr versions) or if
      "sortMissingFirst" or "sortMissingLast" functionality is needed.
      Use Trie based fields instead. Plain numeric field types that
      store and index the text value verbatim (and hence don't support
      range queries, since the lexicographic ordering isn't equal to the
      numeric ordering)
    -->
    <fieldType name="pint" class="solr.IntField" omitNorms="true" />
    <fieldType name="plong" class="solr.LongField" omitNorms="true" />
    <fieldType name="pfloat" class="solr.FloatField"
      omitNorms="true" />
    <fieldType name="pdouble" class="solr.DoubleField"
      omitNorms="true" />
    <fieldType name="pdate" class="solr.DateField"
      sortMissingLast="true" omitNorms="true" />
    <!--
      Note: These should only be used for compatibility with existing
      indexes (created with older Solr versions) or if
      "sortMissingFirst" or "sortMissingLast" functionality is needed.
      Use Trie based fields instead. Numeric field types that manipulate
      the value into a string value that isn't human-readable in its
      internal form, but with a lexicographic ordering the same as the
      numeric ordering, so that range queries work correctly.
    -->
    <fieldType name="sint" class="solr.SortableIntField"
      sortMissingLast="true" omitNorms="true" />
    <fieldType name="slong" class="solr.SortableLongField"
      sortMissingLast="true" omitNorms="true" />
    <fieldType name="sfloat" class="solr.SortableFloatField"
      sortMissingLast="true" omitNorms="true" />
    <fieldType name="sdouble" class="solr.SortableDoubleField"
      sortMissingLast="true" omitNorms="true" />
    <!--
      The "RandomSortField" is not used to store or search any data. You
      can declare fields of this type it in your schema to generate
      pseudo-random orderings of your docs for sorting purposes. The
      ordering is generated based on the field name and the version of
      the index, As long as the index version remains unchanged, and the
      same field name is reused, the ordering of the docs will be
      consistent. If you want different psuedo-random orderings of
      documents, for the same version of the index, use a dynamicField
      and change the name
    -->
    <fieldType name="random" class="solr.RandomSortField"
      indexed="true" />
    <!--
      solr.TextField allows the specification of custom text analyzers
      specified as a tokenizer and a list of token filters. Different
      analyzers may be specified for indexing and querying. The optional
      positionIncrementGap puts space between multiple fields of this
      type on the same document, with the purpose of preventing false
      phrase matching across fields. For more info on customizing your
      analyzer chain, please see
      http://wiki.apache.org/solr/AnalyzersTokenizersTokenFilters
    -->
    <!--
      One can also specify an existing Analyzer class that has a default
      constructor via the class attribute on the analyzer element
      <fieldType name="text_greek" class="solr.TextField"> <analyzer
      class="org.apache.lucene.analysis.el.GreekAnalyzer"/> </fieldType>
    -->
    <!--
      A text field that only splits on whitespace for exact matching of
      words
    -->
    <fieldType name="text_ws" class="solr.TextField"
      positionIncrementGap="100">
      <analyzer>
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
      </analyzer>
    </fieldType>
    <!--
      A text field that uses WordDelimiterFilter to enable splitting and
      matching of words on case-change, alpha numeric boundaries, and
      non-alphanumeric chars, so that a query of "wifi" or "wi fi" could
      match a document containing "Wi-Fi". Synonyms and stopwords are
      customized by external files, and stemming is enabled.
    -->
    <fieldType name="text" class="solr.TextField"
      positionIncrementGap="100">
      <analyzer type="index">
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <!--
          in this example, we will only use synonyms at query time
          <filter class="solr.SynonymFilterFactory"
          synonyms="index_synonyms.txt" ignoreCase="true"
          expand="false"/>
        -->
        <!--
          Case insensitive stop word removal. add
          enablePositionIncrements=true in both the index and query
          analyzers to leave a 'gap' for more accurate phrase queries.
        -->
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" enablePositionIncrements="true" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="1" generateNumberParts="1" catenateWords="1"
          catenateNumbers="1" catenateAll="0" splitOnCaseChange="1" />
        <filter class="solr.LowerCaseFilterFactory" />
      </analyzer>
      <analyzer type="query">
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt"
          ignoreCase="true" expand="true" />
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" enablePositionIncrements="true" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="1" generateNumberParts="1" catenateWords="0"
          catenateNumbers="0" catenateAll="0" splitOnCaseChange="1" />
        <filter class="solr.LowerCaseFilterFactory" />
      </analyzer>
    </fieldType>
    <!--
      Less flexible matching, but less false matches. Probably not ideal
      for product names, but may be good for SKUs. Can insert dashes in
      the wrong place and still match.
    -->
    <fieldType name="textTight" class="solr.TextField"
      positionIncrementGap="100">
      <analyzer>
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt"
          ignoreCase="true" expand="false" />
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="0" generateNumberParts="0" catenateWords="1"
          catenateNumbers="1" catenateAll="0" />
        <filter class="solr.LowerCaseFilterFactory" />
        <!--
          this filter can remove any duplicate tokens that appear at the
          same position - sometimes possible with WordDelimiterFilter in
          conjuncton with stemming.
        -->
        <filter class="solr.RemoveDuplicatesTokenFilterFactory" />
      </analyzer>
    </fieldType>
    <!--
      A general unstemmed text field - good if one does not know the
      language of the field
    -->
    <fieldType name="textgen" class="solr.TextField"
      positionIncrementGap="100">
      <analyzer type="index">
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" enablePositionIncrements="true" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="1" generateNumberParts="1" catenateWords="1"
          catenateNumbers="1" catenateAll="0" splitOnCaseChange="0" />
        <filter class="solr.LowerCaseFilterFactory" />
      </analyzer>
      <analyzer type="query">
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt"
          ignoreCase="true" expand="true" />
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" enablePositionIncrements="true" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="1" generateNumberParts="1" catenateWords="0"
          catenateNumbers="0" catenateAll="0" splitOnCaseChange="0" />
        <filter class="solr.LowerCaseFilterFactory" />
      </analyzer>
    </fieldType>
    <!--
      A general unstemmed text field that indexes tokens normally and
      also reversed (via ReversedWildcardFilterFactory), to enable more
      efficient leading wildcard queries.
    -->
    <fieldType name="text_rev" class="solr.TextField"
      positionIncrementGap="100">
      <analyzer type="index">
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" enablePositionIncrements="true" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="1" generateNumberParts="1" catenateWords="1"
          catenateNumbers="1" catenateAll="0" splitOnCaseChange="0" />
        <filter class="solr.LowerCaseFilterFactory" />
        <filter class="solr.ReversedWildcardFilterFactory"
          withOriginal="true" maxPosAsterisk="3" maxPosQuestion="2"
          maxFractionAsterisk="0.33" />
      </analyzer>
      <analyzer type="query">
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <filter class="solr.SynonymFilterFactory" synonyms="synonyms.txt"
          ignoreCase="true" expand="true" />
        <filter class="solr.StopFilterFactory" ignoreCase="true"
          words="stopwords.txt" enablePositionIncrements="true" />
        <filter class="solr.WordDelimiterFilterFactory"
          generateWordParts="1" generateNumberParts="1" catenateWords="0"
          catenateNumbers="0" catenateAll="0" splitOnCaseChange="0" />
        <filter class="solr.LowerCaseFilterFactory" />
      </analyzer>
    </fieldType>
    <!-- charFilter + WhitespaceTokenizer  -->
    <!--
      <fieldType name="textCharNorm" class="solr.TextField"
      positionIncrementGap="100" > <analyzer> <charFilter
      class="solr.MappingCharFilterFactory"
      mapping="mapping-ISOLatin1Accent.txt"/> <tokenizer
      class="solr.WhitespaceTokenizerFactory"/> </analyzer> </fieldType>
    -->
    <!--
      This is an example of using the KeywordTokenizer along With
      various TokenFilterFactories to produce a sortable field that does
      not include some properties of the source text
    -->
    <fieldType name="alphaOnlySort" class="solr.TextField"
      sortMissingLast="true" omitNorms="true">
      <analyzer>
        <!--
          KeywordTokenizer does no actual tokenizing, so the entire
          input string is preserved as a single token
        -->
        <tokenizer class="solr.KeywordTokenizerFactory" />
        <!--
          The LowerCase TokenFilter does what you expect, which can be
          when you want your sorting to be case insensitive
        -->
        <filter class="solr.LowerCaseFilterFactory" />
        <!-- The TrimFilter removes any leading or trailing whitespace -->
        <filter class="solr.TrimFilterFactory" />
        <!--
          The PatternReplaceFilter gives you the flexibility to use Java
          Regular expression to replace any sequence of characters
          matching a pattern with an arbitrary replacement string, which
          may include back references to portions of the original string
          matched by the pattern. See the Java Regular Expression
          documentation for more information on pattern and replacement
          string syntax.
          http://java.sun.com/j2se/1.5.0/docs/api/java/util/regex/package-summary.html
        -->
        <filter class="solr.PatternReplaceFilterFactory" pattern="([^a-z])"
          replacement="" replace="all" />
      </analyzer>
    </fieldType>
    <fieldtype name="phonetic" stored="false" indexed="true"
      class="solr.TextField">
      <analyzer>
        <tokenizer class="solr.StandardTokenizerFactory" />
        <filter class="solr.DoubleMetaphoneFilterFactory" inject="false" />
      </analyzer>
    </fieldtype>
    <fieldtype name="payloads" stored="false" indexed="true"
      class="solr.TextField">
      <analyzer>
        <tokenizer class="solr.WhitespaceTokenizerFactory" />
        <!--
          The DelimitedPayloadTokenFilter can put payloads on tokens...
          for example, a token of "foo|1.4" would be indexed as "foo"
          with a payload of 1.4f Attributes of the
          DelimitedPayloadTokenFilterFactory : "delimiter" - a one
          character delimiter. Default is | (pipe) "encoder" - how to
          encode the following value into a playload float ->
          org.apache.lucene.analysis.payloads.FloatEncoder, integer ->
          o.a.l.a.p.IntegerEncoder identity -> o.a.l.a.p.IdentityEncoder
          Fully Qualified class name implementing PayloadEncoder,
          Encoder must have a no arg constructor.
        -->
        <filter class="solr.DelimitedPayloadTokenFilterFactory"
          encoder="float" />
      </analyzer>
    </fieldtype>
    <!--
      lowercases the entire field value, keeping it as a single token.
    -->
    <fieldType name="lowercase" class="solr.TextField"
      positionIncrementGap="100">
      <analyzer>
        <tokenizer class="solr.KeywordTokenizerFactory" />
        <filter class="solr.LowerCaseFilterFactory" />
      </analyzer>
    </fieldType>
    <!--
      since fields of this type are by default not stored or indexed,
      any data added to them will be ignored outright.
    -->
    <fieldtype name="ignored" stored="false" indexed="false"
      multiValued="true" class="solr.StrField" />
  </types>
  <fields>
    <!--
      Valid attributes for fields: name: mandatory - the name for the
      field type: mandatory - the name of a previously defined type from
      the <types> section indexed: true if this field should be indexed
      (searchable or sortable) stored: true if this field should be
      retrievable compressed: [false] if this field should be stored
      using gzip compression (this will only apply if the field type is
      compressable; among the standard field types, only TextField and
      StrField are) multiValued: true if this field may contain multiple
      values per document omitNorms: (expert) set to true to omit the
      norms associated with this field (this disables length
      normalization and index-time boosting for the field, and saves
      some memory). Only full-text fields or fields that need an
      index-time boost need norms. termVectors: [false] set to true to
      store the term vector for a given field. When using MoreLikeThis,
      fields used for similarity should be stored for best performance.
      termPositions: Store position information with the term vector.
      This will increase storage costs. termOffsets: Store offset
      information with the term vector. This will increase storage
      costs. default: a value that should be used if no value is
      specified when adding a document.
    -->
    <field name="id" type="string" indexed="true" stored="true"
      required="true" />
    <field name="sku" type="textTight" indexed="true" stored="true"
      omitNorms="true" />
    <field name="name" type="textgen" indexed="true" stored="true" />
    <field name="alphaNameSort" type="alphaOnlySort" indexed="true"
      stored="false" />
    <field name="manu" type="textgen" indexed="true" stored="true"
      omitNorms="true" />
    <field name="cat" type="text_ws" indexed="true" stored="true"
      multiValued="true" omitNorms="true" />
    <field name="features" type="text" indexed="true" stored="true"
      multiValued="true" />
    <field name="includes" type="text" indexed="true" stored="true"
      termVectors="true" termPositions="true" termOffsets="true" />
    <field name="weight" type="float" indexed="true" stored="true" />
    <field name="price" type="float" indexed="true" stored="true" />
    <field name="popularity" type="int" indexed="true" stored="true" />
    <field name="inStock" type="boolean" indexed="true" stored="true" />
    <!--
      Common metadata fields, named specifically to match up with
      SolrCell metadata when parsing rich documents such as Word, PDF.
      Some fields are multiValued only because Tika currently may return
      multiple values for them.
    -->
    <field name="title" type="text" indexed="true" stored="true"
      multiValued="true" />
    <field name="subject" type="text" indexed="true" stored="true" />
    <field name="description" type="text" indexed="true" stored="true" />
    <field name="comments" type="text" indexed="true" stored="true" />
    <field name="author" type="textgen" indexed="true" stored="true" />
    <field name="keywords" type="textgen" indexed="true" stored="true" />
    <field name="category" type="textgen" indexed="true" stored="true" />
    <field name="content_type" type="string" indexed="true"
      stored="true" multiValued="true" />
    <field name="last_modified" type="date" indexed="true" stored="true" />
    <field name="links" type="string" indexed="true" stored="true"
      multiValued="true" />
    <!--
      catchall field, containing all other searchable text fields
      (implemented via copyField further on in this schema
    -->
    <field name="text" type="text" indexed="true" stored="false"
      multiValued="true" />
    <!--
      catchall text field that indexes tokens both normally and in
      reverse for efficient leading wildcard queries.
    -->
    <field name="text_rev" type="text_rev" indexed="true" stored="false"
      multiValued="true" />
    <!--
      non-tokenized version of manufacturer to make it easier to sort or
      group results by manufacturer. copied from "manu" via copyField
    -->
    <field name="manu_exact" type="string" indexed="true" stored="false" />
    <field name="payloads" type="payloads" indexed="true" stored="true" />
    <!--
      Uncommenting the following will create a "timestamp" field using a
      default value of "NOW" to indicate when each document was indexed.
    -->
    <!--
      <field name="timestamp" type="date" indexed="true" stored="true"
      default="NOW" multiValued="false"/>
    -->
  <field name="language" type="string" indexed="true" stored="true" required="false"/>
  <field name="concept" type="string" indexed="true" stored="true" multiValued="true" required="false"/>
  <field name="keyword" type="string" indexed="true" stored="true" multiValued="true" required="false"/>
  <field name="suggested_category" type="string" indexed="true" stored="true" multiValued="false" required="false"/>
  <field name="sentence" type="text" indexed="true" stored="true" multiValued="true" required="false" />
  <dynamicField name="entity*" type="text" indexed="true" stored="true" multiValued="true"/>
    <!--
      Dynamic field definitions. If a field name is not found,
      dynamicFields will be used if the name matches any of the
      patterns. RESTRICTION: the glob-like pattern in the name attribute
      must have a "*" only at the start or the end. EXAMPLE: name="*_i"
      will match any field ending in _i (like myid_i, z_i) Longer
      patterns will be matched first. if equal size patterns both match,
      the first appearing in the schema will be used. <dynamicField
      name="*_i" type="int" indexed="true" stored="true"/> <dynamicField
      name="*_s" type="string" indexed="true" stored="true"/>
      <dynamicField name="*_l" type="long" indexed="true"
      stored="true"/> <dynamicField name="*_t" type="text"
      indexed="true" stored="true"/> <dynamicField name="*_b"
      type="boolean" indexed="true" stored="true"/> <dynamicField
      name="*_f" type="float" indexed="true" stored="true"/>
      <dynamicField name="*_d" type="double" indexed="true"
      stored="true"/> <dynamicField name="*_dt" type="date"
      indexed="true" stored="true"/> <dynamicField name="*_ti"
      type="tint" indexed="true" stored="true"/> <dynamicField
      name="*_tl" type="tlong" indexed="true" stored="true"/>
      <dynamicField name="*_tf" type="tfloat" indexed="true"
      stored="true"/> <dynamicField name="*_td" type="tdouble"
      indexed="true" stored="true"/> <dynamicField name="*_tdt"
      type="tdate" indexed="true" stored="true"/> <dynamicField
      name="*_pi" type="pint" indexed="true" stored="true"/>
      <dynamicField name="ignored_*" type="ignored" multiValued="true"/>
      <dynamicField name="attr_*" type="textgen" indexed="true"
      stored="true" multiValued="true"/> <dynamicField name="random_*"
      type="random" />
    -->
    <!--
      uncomment the following to ignore any fields that don't already
      match an existing field name or dynamic field, rather than
      reporting them as an error. alternately, change the type="ignored"
      to some other type e.g. "text" if you want unknown fields indexed
      and/or stored by default
    -->
    <!--dynamicField name="*" type="ignored" multiValued="true" /-->
  </fields>
  <!--
    Field to use to determine and enforce document uniqueness. Unless
    this field is marked with required="false", it will be a required
    field
  -->
  <uniqueKey>id</uniqueKey>
  <!--
    field for the QueryParser to use when an explicit fieldname is
    absent
  -->
  <defaultSearchField>text</defaultSearchField>
  <!-- SolrQueryParser configuration: defaultOperator="AND|OR" -->
  <solrQueryParser defaultOperator="OR" />
  <!--
    copyField commands copy one field to another at the time a document
    is added to the index. It's used either to index the same field
    differently, or to add multiple fields to the same field for
    easier/faster searching.
  -->
  <copyField source="cat" dest="text" />
  <copyField source="name" dest="text" />
  <copyField source="manu" dest="text" />
  <copyField source="features" dest="text" />
  <copyField source="includes" dest="text" />
  <copyField source="manu" dest="manu_exact" />
  <!--copyField source="Titolo" dest="text"/-->
  <!--
    Above, multiple source fields are copied to the [text] field.
    Another way to map multiple source fields to the same destination
    field is to use the dynamic field syntax. copyField also supports a
    maxChars to copy setting.
  -->
  <!-- <copyField source="*_t" dest="text" maxChars="3000"/> -->
  <!--
    copy name to alphaNameSort, a field designed for sorting by name
  -->
  <!-- <copyField source="name" dest="alphaNameSort"/> -->
  <!--
    Similarity is the scoring routine for each document vs. a query. A
    custom similarity may be specified here, but the default is fine for
    most applications.
  -->
  <!--
    <similarity class="org.apache.lucene.search.DefaultSimilarity"/>
  -->
  <!--
    ... OR ... Specify a SimilarityFactory class name implementation
    allowing parameters to be used.
  -->
  <!--
    <similarity class="com.example.solr.CustomSimilarityFactory"> <str
    name="paramkey">param value</str> </similarity>
  -->
 </schema>
--- a/solr/contrib/uima/src/test/resources/solr-uima/conf/solrconfig.xml
+++ b/solr/contrib/uima/src/test/resources/solr-uima/conf/solrconfig.xml
--- a/solr/contrib/uima/src/test/resources/solr-uima/conf/spellings.txt
+++ b/solr/contrib/uima/src/test/resources/solr-uima/conf/spellings.txt
@ -0,0 +1,2 @@
 pizza
 history
--- a/solr/contrib/uima/src/test/resources/solr-uima/conf/stopwords.txt
+++ b/solr/contrib/uima/src/test/resources/solr-uima/conf/stopwords.txt
@ -0,0 +1,58 @@
 # Licensed to the Apache Software Foundation (ASF) under one or more
 # contributor license agreements.  See the NOTICE file distributed with
 # this work for additional information regarding copyright ownership.
 # The ASF licenses this file to You under the Apache License, Version 2.0
 # (the "License"); you may not use this file except in compliance with
 # the License.  You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #-----------------------------------------------------------------------
 # a couple of test stopwords to test that the words are really being
 # configured from this file:
 stopworda
 stopwordb
 #Standard english stop words taken from Lucene's StopAnalyzer
 a
 an
 and
 are
 as
 at
 be
 but
 by
 for
 if
 in
 into
 is
 it
 no
 not
 of
 on
 or
 s
 such
 t
 that
 the
 their
 then
 there
 these
 they
 this
 to
 was
 will
 with
--- a/solr/contrib/uima/src/test/resources/solr-uima/conf/synonyms.txt
+++ b/solr/contrib/uima/src/test/resources/solr-uima/conf/synonyms.txt
@ -0,0 +1,31 @@
 # The ASF licenses this file to You under the Apache License, Version 2.0
 # (the "License"); you may not use this file except in compliance with
 # the License.  You may obtain a copy of the License at
 #
 #     http://www.apache.org/licenses/LICENSE-2.0
 #
 # Unless required by applicable law or agreed to in writing, software
 # distributed under the License is distributed on an "AS IS" BASIS,
 # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 # See the License for the specific language governing permissions and
 # limitations under the License.
 #-----------------------------------------------------------------------
 #some test synonym mappings unlikely to appear in real input text
 aaa => aaaa
 bbb => bbbb1 bbbb2
 ccc => cccc1,cccc2
 a\=>a => b\=>b
 a\,a => b\,b
 fooaaa,baraaa,bazaaa
 # Some synonym groups specific to this example
 GB,gib,gigabyte,gigabytes
 MB,mib,megabyte,megabytes
 Television, Televisions, TV, TVs
 #notice we use "gib" instead of "GiB" so any WordDelimiterFilter coming
 #after us won't split it into two words.
 # Synonym mappings can be used for spelling correction too
 pixima => pixma
		`@ -0,0 +1,2 @@`
							`AnyObjectId[9c8bd13a2002a9ff5b35b873b9f111d5281ad201] was removed in git history.`
							`Apache SVN contains full history.`
		`@ -0,0 +1,2 @@`
							`AnyObjectId[532939ecab6b77ccb77af3635c55ff9752b70ab7] was removed in git history.`
							`Apache SVN contains full history.`
		`@ -0,0 +1,2 @@`
							`AnyObjectId[33165678da937e03cb069449b40f1cf690beda0a] was removed in git history.`
							`Apache SVN contains full history.`
		`@ -0,0 +1,2 @@`
							`AnyObjectId[5dfc32bce5e444a9bb3387d664485f7bfdc438ad] was removed in git history.`
							`Apache SVN contains full history.`
		`@ -0,0 +1,2 @@`
							`AnyObjectId[bf90c19d2c1f77e300b94363385841ec1225b4b9] was removed in git history.`
							`Apache SVN contains full history.`
		`@ -0,0 +1,2 @@`
							`AnyObjectId[9518da64cdf5d378273ab40a06823a7768f18ece] was removed in git history.`
							`Apache SVN contains full history.`
		`@ -0,0 +1,2 @@`
							`AnyObjectId[72991424bdfe4776f66feab7ff4e8564f12d2659] was removed in git history.`
							`Apache SVN contains full history.`