mirror of https://github.com/apache/lucene.git
LUCENE-3312: Merged revision(s) 1366639-1371131 from lucene/dev/trunk:
SOLR-3259: default /get to json ........ minor tweaks to update script example ........ LUCENE-4268: Rename ResourceAsStreamReasourceLoader to ClasspathResourceLoader, provide FilesystemResourceLoader, bug fixing ........ LUCENE-4268: Fix test bug ........ SOLR-3648: Fix Velocity template loading in SolrCloud mode ........ fix confusing IW infoStream message ........ Fix rawtypes warning in java 7 and 8, make the SuppressWarnings more local ........ Nicer solution to generic array creation (still problematic in Java 6, but correct in Java 7 if done this way) ........ Disable test failing with Java 8 ........ Allow detecting of Java 8 ........ LUCENE-4109: BooleanQueries are not parsed correctly with the flexible queryparser ........ LUCENE-4269: remove BalancedSegmentMergePolicy (use TieredMergePolicy instead) ........ LUCENE-4269: deprecate BalancedSegmentMergePolicy (use TieredMergePolicy instead) ........ LUCENE-4190: restrict allowed filenames to reduce risk of deleting non-lucene file from the index directory ........ fix the monkey: connection loss and expiration cause NPE ........ upgrade checkJavaDocs.py to python3 ........ LUCENE-3884: Move ElisionFilter out of .fr package ........ fix encoding in javadocs checker ........ LUCENE-2501: fix thread hazard when threads add same field with different IndexOptions at the same time ........ git-svn-id: https://svn.apache.org/repos/asf/lucene/dev/branches/lucene3312@1371142 13f79535-47bb-0310-9956-ffa450edef68
This commit is contained in:
commit
148d99cbbc
65
build.xml
65
build.xml
|
@ -176,22 +176,57 @@
|
|||
</subant>
|
||||
</target>
|
||||
|
||||
<target name="jar-checksums" depends="resolve" description="Recompute SHA1 checksums for all JAR files.">
|
||||
<delete>
|
||||
<fileset dir="${basedir}">
|
||||
<include name="**/*.jar.sha1"/>
|
||||
</fileset>
|
||||
</delete>
|
||||
<target name="jar-checksums" description="Recompute SHA1 checksums for all JAR files.">
|
||||
<sequential>
|
||||
<subant target="jar-checksums" inheritall="false" failonerror="true">
|
||||
<fileset dir="lucene" includes="build.xml" />
|
||||
<fileset dir="solr" includes="build.xml" />
|
||||
</subant>
|
||||
</sequential>
|
||||
</target>
|
||||
|
||||
<checksum algorithm="SHA1" fileext=".sha1">
|
||||
<fileset dir="${basedir}">
|
||||
<include name="**/*.jar"/>
|
||||
</fileset>
|
||||
</checksum>
|
||||
<property name="python32.exe" value="python3.2" />
|
||||
<property name="JAVA6_HOME" value="/usr/local/jdk1.6.0_27"/>
|
||||
<property name="JAVA7_HOME" value="/usr/local/jdk1.7.0_01"/>
|
||||
<property name="fakeRelease" value="lucene/build/fakeRelease"/>
|
||||
<property name="fakeReleaseTmp" value="lucene/build/fakeReleaseTmp"/>
|
||||
<property name="fakeReleaseVersion" value="5.0"/> <!-- *not* -SNAPSHOT, the real version -->
|
||||
|
||||
<fixcrlf
|
||||
srcdir="${basedir}"
|
||||
includes="**/*.jar.sha1"
|
||||
eol="lf" fixlast="true" encoding="US-ASCII" />
|
||||
<target name="nightly-smoke" description="Builds an unsigned release and smoke tests it." depends="clean">
|
||||
<sequential>
|
||||
<subant target="prepare-release-no-sign" inheritall="false" failonerror="true">
|
||||
<fileset dir="lucene" includes="build.xml" />
|
||||
<fileset dir="solr" includes="build.xml" />
|
||||
<property name="version" value="${fakeReleaseVersion}" />
|
||||
</subant>
|
||||
<delete dir="${fakeRelease}"/>
|
||||
<delete dir="${fakeReleaseTmp}"/>
|
||||
<mkdir dir="${fakeRelease}"/>
|
||||
<copy todir="${fakeRelease}/lucene">
|
||||
<fileset dir="lucene/dist"/>
|
||||
</copy>
|
||||
<copy todir="${fakeRelease}/lucene/changes">
|
||||
<fileset dir="lucene/build/docs/changes"/>
|
||||
</copy>
|
||||
<get src="http://people.apache.org/keys/group/lucene.asc"
|
||||
dest="${fakeRelease}/lucene/KEYS"/>
|
||||
<copy todir="${fakeRelease}/solr">
|
||||
<fileset dir="solr/package"/>
|
||||
</copy>
|
||||
<copy file="${fakeRelease}/lucene/KEYS" todir="${fakeRelease}/solr"/>
|
||||
<makeurl file="${fakeRelease}" validate="false" property="fakeRelease.uri"/>
|
||||
<exec executable="${python32.exe}" failonerror="true">
|
||||
<arg value="-u"/>
|
||||
<arg value="dev-tools/scripts/smokeTestRelease.py"/>
|
||||
<arg value="${fakeRelease.uri}"/>
|
||||
<arg value="${fakeReleaseVersion}"/>
|
||||
<arg value="${fakeReleaseTmp}"/>
|
||||
<arg value="false"/>
|
||||
<env key="JAVA6_HOME" value="${JAVA6_HOME}"/>
|
||||
<env key="JAVA7_HOME" value="${JAVA7_HOME}"/>
|
||||
</exec>
|
||||
<delete dir="${fakeRelease}"/>
|
||||
<delete dir="${fakeReleaseTmp}"/>
|
||||
</sequential>
|
||||
</target>
|
||||
</project>
|
||||
|
|
|
@ -15,30 +15,30 @@
|
|||
<classpathentry kind="src" path="lucene/sandbox/src/java"/>
|
||||
<classpathentry kind="src" path="lucene/sandbox/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/test-framework/src/java"/>
|
||||
<classpathentry kind="src" output="bin.tests-framework" path="lucene/test-framework/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/tests-framework" path="lucene/test-framework/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/common/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-common" path="lucene/analysis/common/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-common" path="lucene/analysis/common/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/common/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/icu/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-icu" path="lucene/analysis/icu/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-icu" path="lucene/analysis/icu/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/icu/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/kuromoji/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-kuromoji" path="lucene/analysis/kuromoji/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-kuromoji" path="lucene/analysis/kuromoji/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/kuromoji/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/phonetic/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-phonetic" path="lucene/analysis/phonetic/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-phonetic" path="lucene/analysis/phonetic/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/phonetic/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/smartcn/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-smartcn" path="lucene/analysis/smartcn/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-smartcn" path="lucene/analysis/smartcn/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/smartcn/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/stempel/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-stempel" path="lucene/analysis/stempel/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-stempel" path="lucene/analysis/stempel/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/stempel/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/morfologik/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-morfologik" path="lucene/analysis/morfologik/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-morfologik" path="lucene/analysis/morfologik/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/morfologik/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/uima/src/java"/>
|
||||
<classpathentry kind="src" output="bin.analysis-uima" path="lucene/analysis/uima/src/resources"/>
|
||||
<classpathentry kind="src" output="bin/analysis-uima" path="lucene/analysis/uima/src/resources"/>
|
||||
<classpathentry kind="src" path="lucene/analysis/uima/src/test"/>
|
||||
<classpathentry kind="src" path="lucene/benchmark/src/java"/>
|
||||
<classpathentry kind="src" path="lucene/benchmark/src/test"/>
|
||||
|
@ -120,7 +120,7 @@
|
|||
<classpathentry kind="lib" path="solr/lib/slf4j-api-1.6.4.jar"/>
|
||||
<classpathentry kind="lib" path="solr/lib/slf4j-jdk14-1.6.4.jar"/>
|
||||
<classpathentry kind="lib" path="solr/lib/wstx-asl-3.2.7.jar"/>
|
||||
<classpathentry kind="lib" path="solr/lib/zookeeper-3.3.5.jar"/>
|
||||
<classpathentry kind="lib" path="solr/lib/zookeeper-3.3.6.jar"/>
|
||||
<classpathentry kind="lib" path="solr/example/lib/jetty-continuation-8.1.2.v20120308.jar"/>
|
||||
<classpathentry kind="lib" path="solr/example/lib/jetty-deploy-8.1.2.v20120308.jar"/>
|
||||
<classpathentry kind="lib" path="solr/example/lib/jetty-http-8.1.2.v20120308.jar"/>
|
||||
|
@ -175,5 +175,5 @@
|
|||
<classpathentry kind="lib" path="solr/contrib/velocity/lib/commons-collections-3.2.1.jar"/>
|
||||
<classpathentry kind="con" path="org.eclipse.jdt.launching.JRE_CONTAINER"/>
|
||||
<classpathentry kind="lib" path="lucene/test-framework/lib/randomizedtesting-runner-1.6.0.jar"/>
|
||||
<classpathentry kind="output" path="bin"/>
|
||||
<classpathentry kind="output" path="bin/other"/>
|
||||
</classpath>
|
||||
|
|
|
@ -36,27 +36,25 @@ A. How to use nightly Jenkins-built Lucene/Solr Maven artifacts
|
|||
|
||||
B. How to generate Lucene/Solr Maven artifacts
|
||||
|
||||
Prerequisites: JDK 1.6+ and Ant 1.7.X
|
||||
Prerequisites: JDK 1.6+ and Ant 1.8.2+
|
||||
|
||||
Run 'ant generate-maven-artifacts' to create an internal Maven
|
||||
repository, including POMs, binary .jars, source .jars, and javadoc
|
||||
.jars.
|
||||
|
||||
You can run the above command in four possible places: the top-level
|
||||
directory; under lucene/; under solr/; or under modules/. From the
|
||||
top-level directory, from lucene/, or from modules/, the internal
|
||||
repository will be located at dist/maven/. From solr/, the internal
|
||||
repository will be located at package/maven/.
|
||||
You can run the above command in three possible places: the top-level
|
||||
directory; under lucene/; or under solr/. From the top-level directory
|
||||
or from lucene/, the internal repository will be located at dist/maven/.
|
||||
From solr/, the internal repository will be located at package/maven/.
|
||||
|
||||
|
||||
C. How to deploy Maven artifacts to a repository
|
||||
|
||||
Prerequisites: JDK 1.6+ and Ant 1.7.X
|
||||
Prerequisites: JDK 1.6+ and Ant 1.8.2+
|
||||
|
||||
You can deploy targets for all of Lucene/Solr, only Lucene, only Solr,
|
||||
or only modules/, as in B. above. To deploy to a Maven repository, the
|
||||
command is the same as in B. above, with the addition of two system
|
||||
properties:
|
||||
You can deploy targets for all of Lucene/Solr, only Lucene, or only Solr,
|
||||
as in B. above. To deploy to a Maven repository, the command is the same
|
||||
as in B. above, with the addition of two system properties:
|
||||
|
||||
ant -Dm2.repository.id=my-repo-id \
|
||||
-Dm2.repository.url=http://example.org/my/repo \
|
||||
|
@ -101,7 +99,7 @@ D. How to use Maven to build Lucene/Solr
|
|||
the default, you can supply an alternate version on the command line
|
||||
with the above command, e.g.:
|
||||
|
||||
ant -Dversion=5.0-my-special-version get-maven-poms
|
||||
ant -Dversion=my-special-version get-maven-poms
|
||||
|
||||
Note: if you change the version in the POMs, there is one test method
|
||||
that will fail under maven-surefire-plugin:
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -77,33 +71,5 @@
|
|||
</excludes>
|
||||
</testResource>
|
||||
</testResources>
|
||||
<plugins>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<configuration>
|
||||
<extraJvmArguments>-Xmx128M</extraJvmArguments>
|
||||
<repositoryLayout>flat</repositoryLayout>
|
||||
<platforms>
|
||||
<platform>windows</platform>
|
||||
<platform>unix</platform>
|
||||
</platforms>
|
||||
<programs>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.analysis.charfilter.HtmlStripCharFilter</mainClass>
|
||||
<name>HtmlStripCharFilter</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.analysis.en.PorterStemmer</mainClass>
|
||||
<name>EnglishPorterStemmer</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.tartarus.snowball.TestApp</mainClass>
|
||||
<name>SnowballTestApp</name>
|
||||
</program>
|
||||
</programs>
|
||||
</configuration>
|
||||
</plugin>
|
||||
</plugins>
|
||||
</build>
|
||||
</project>
|
||||
|
|
|
@ -40,15 +40,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -39,15 +39,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -39,15 +39,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -75,6 +69,11 @@
|
|||
<build>
|
||||
<sourceDirectory>${module-path}/src/java</sourceDirectory>
|
||||
<testSourceDirectory>${module-path}/src/test</testSourceDirectory>
|
||||
<resources>
|
||||
<resource>
|
||||
<directory>${module-path}/src/resources</directory>
|
||||
</resource>
|
||||
</resources>
|
||||
<testResources>
|
||||
<testResource>
|
||||
<directory>${project.build.testSourceDirectory}</directory>
|
||||
|
|
|
@ -39,15 +39,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -75,6 +69,11 @@
|
|||
<build>
|
||||
<sourceDirectory>${module-path}/src/java</sourceDirectory>
|
||||
<testSourceDirectory>${module-path}/src/test</testSourceDirectory>
|
||||
<resources>
|
||||
<resource>
|
||||
<directory>${module-path}/src/resources</directory>
|
||||
</resource>
|
||||
</resources>
|
||||
<testResources>
|
||||
<testResource>
|
||||
<directory>${project.build.testSourceDirectory}</directory>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -41,15 +41,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -120,41 +114,5 @@
|
|||
</includes>
|
||||
</testResource>
|
||||
</testResources>
|
||||
<plugins>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<configuration>
|
||||
<extraJvmArguments>-Xmx128M</extraJvmArguments>
|
||||
<repositoryLayout>flat</repositoryLayout>
|
||||
<platforms>
|
||||
<platform>windows</platform>
|
||||
<platform>unix</platform>
|
||||
</platforms>
|
||||
<programs>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.benchmark.byTask.Benchmark</mainClass>
|
||||
<name>Benchmark</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.benchmark.quality.trec.QueryDriver</mainClass>
|
||||
<name>QueryDriver</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.benchmark.quality.utils.QualityQueriesFinder</mainClass>
|
||||
<name>QualityQueriesFinder</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.benchmark.utils.ExtractReuters</mainClass>
|
||||
<name>ExtractReuters</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.benchmark.utils.ExtractWikipedia</mainClass>
|
||||
<name>ExtractWikipedia</name>
|
||||
</program>
|
||||
</programs>
|
||||
</configuration>
|
||||
</plugin>
|
||||
</plugins>
|
||||
</build>
|
||||
</project>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -104,40 +98,6 @@
|
|||
</systemPropertyVariables>
|
||||
</configuration>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<configuration>
|
||||
<extraJvmArguments>-Xmx128M</extraJvmArguments>
|
||||
<repositoryLayout>flat</repositoryLayout>
|
||||
<platforms>
|
||||
<platform>windows</platform>
|
||||
<platform>unix</platform>
|
||||
</platforms>
|
||||
<programs>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.index.CheckIndex</mainClass>
|
||||
<name>CheckIndex</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.index.IndexReader</mainClass>
|
||||
<name>IndexReader</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.store.LockStressTest</mainClass>
|
||||
<name>LockStressTest</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.store.LockVerifyServer</mainClass>
|
||||
<name>LockVerifyServer</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.util.English</mainClass>
|
||||
<name>English</name>
|
||||
</program>
|
||||
</programs>
|
||||
</configuration>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>build-helper-maven-plugin</artifactId>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -87,30 +81,5 @@
|
|||
</excludes>
|
||||
</testResource>
|
||||
</testResources>
|
||||
<plugins>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<configuration>
|
||||
<extraJvmArguments>-Xmx128M</extraJvmArguments>
|
||||
<repositoryLayout>flat</repositoryLayout>
|
||||
<assembleDirectory>${build-directory}</assembleDirectory>
|
||||
<platforms>
|
||||
<platform>windows</platform>
|
||||
<platform>unix</platform>
|
||||
</platforms>
|
||||
<programs>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.demo.IndexFiles</mainClass>
|
||||
<name>IndexFiles</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.demo.SearchFiles</mainClass>
|
||||
<name>SearchFiles</name>
|
||||
</program>
|
||||
</programs>
|
||||
</configuration>
|
||||
</plugin>
|
||||
</plugins>
|
||||
</build>
|
||||
</project>
|
||||
|
|
|
@ -39,15 +39,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -39,15 +39,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -39,15 +39,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -72,49 +66,5 @@
|
|||
</excludes>
|
||||
</testResource>
|
||||
</testResources>
|
||||
<plugins>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<configuration>
|
||||
<extraJvmArguments>-Xmx128M</extraJvmArguments>
|
||||
<repositoryLayout>flat</repositoryLayout>
|
||||
<platforms>
|
||||
<platform>windows</platform>
|
||||
<platform>unix</platform>
|
||||
</platforms>
|
||||
<programs>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.index.FieldNormModifier</mainClass>
|
||||
<name>FieldNormModifier</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.index.IndexSplitter</mainClass>
|
||||
<name>IndexSplitter</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.index.MultiPassIndexSplitter</mainClass>
|
||||
<name>MultiPassIndexSplitter</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.misc.GetTermInfo</mainClass>
|
||||
<name>GetTermInfo</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.misc.HighFreqTerms</mainClass>
|
||||
<name>HighFreqTerms</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.misc.IndexMergeTool</mainClass>
|
||||
<name>IndexMergeTool</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.lucene.misc.LengthNormModifier</mainClass>
|
||||
<name>LengthNormModifier</name>
|
||||
</program>
|
||||
</programs>
|
||||
</configuration>
|
||||
</plugin>
|
||||
</plugins>
|
||||
</build>
|
||||
</project>
|
||||
|
|
|
@ -35,15 +35,9 @@
|
|||
<module-directory>lucene</module-directory>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<modules>
|
||||
<module>core</module>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -31,15 +31,18 @@
|
|||
<version>@version@</version>
|
||||
<packaging>pom</packaging>
|
||||
<name>Grandparent POM for Apache Lucene Core and Apache Solr</name>
|
||||
<description>Parent POM for Apache Lucene Core and Apache Solr</description>
|
||||
<url>http://lucene.apache.org/java</url>
|
||||
<description>Grandparent POM for Apache Lucene Core and Apache Solr</description>
|
||||
<url>http://lucene.apache.org</url>
|
||||
<modules>
|
||||
<module>lucene</module>
|
||||
<module>solr</module>
|
||||
</modules>
|
||||
<properties>
|
||||
<top-level>..</top-level>
|
||||
<base.specification.version>4.0.0</base.specification.version>
|
||||
<vc-anonymous-base-url>http://svn.apache.org/repos/asf/lucene/dev/trunk</vc-anonymous-base-url>
|
||||
<vc-dev-base-url>https://svn.apache.org/repos/asf/lucene/dev/trunk</vc-dev-base-url>
|
||||
<vc-browse-base-url>http://svn.apache.org/viewvc/lucene/dev/trunk</vc-browse-base-url>
|
||||
<base.specification.version>5.0.0</base.specification.version>
|
||||
<maven.build.timestamp.format>yyyy-MM-dd HH:mm:ss</maven.build.timestamp.format>
|
||||
<java.compat.version>1.6</java.compat.version>
|
||||
<jetty.version>8.1.2.v20120308</jetty.version>
|
||||
|
@ -69,11 +72,11 @@
|
|||
</properties>
|
||||
<issueManagement>
|
||||
<system>JIRA</system>
|
||||
<url>http://issues.apache.org/jira/browse/LUCENE</url>
|
||||
<url>https://issues.apache.org/jira/browse/LUCENE</url>
|
||||
</issueManagement>
|
||||
<ciManagement>
|
||||
<system>Hudson</system>
|
||||
<url>http://lucene.zones.apache.org:8080/hudson/job/Lucene-Nightly/</url>
|
||||
<system>Jenkins</system>
|
||||
<url>https://builds.apache.org/computer/lucene/</url>
|
||||
</ciManagement>
|
||||
<mailingLists>
|
||||
<mailingList>
|
||||
|
@ -109,15 +112,9 @@
|
|||
</mailingLists>
|
||||
<inceptionYear>2000</inceptionYear>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}</developerConnection>
|
||||
<url>${vc-browse-base-url}</url>
|
||||
</scm>
|
||||
<licenses>
|
||||
<license>
|
||||
|
@ -298,7 +295,7 @@
|
|||
<dependency>
|
||||
<groupId>org.apache.zookeeper</groupId>
|
||||
<artifactId>zookeeper</artifactId>
|
||||
<version>3.3.5</version>
|
||||
<version>3.3.6</version>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.carrot2</groupId>
|
||||
|
@ -549,11 +546,6 @@
|
|||
</archive>
|
||||
</configuration>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<version>1.2.1</version>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>build-helper-maven-plugin</artifactId>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -41,15 +41,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -42,15 +42,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -38,15 +38,9 @@
|
|||
<surefire-top-level>${top-level}/../..</surefire-top-level>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
@ -254,37 +248,6 @@
|
|||
</systemPropertyVariables>
|
||||
</configuration>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>appassembler-maven-plugin</artifactId>
|
||||
<configuration>
|
||||
<extraJvmArguments>-Xmx128M</extraJvmArguments>
|
||||
<repositoryLayout>flat</repositoryLayout>
|
||||
<platforms>
|
||||
<platform>windows</platform>
|
||||
<platform>unix</platform>
|
||||
</platforms>
|
||||
<programs>
|
||||
<program>
|
||||
<mainClass>org.apache.solr.client.solrj.embedded.JettySolrRunner</mainClass>
|
||||
<name>JettySolrRunner</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.solr.util.BitSetPerf</mainClass>
|
||||
<name>BitSetPerf</name>
|
||||
<extraJvmArguments>-Xms128m -Xbatch</extraJvmArguments>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.solr.util.SimplePostTool</mainClass>
|
||||
<name>SimplePostTool</name>
|
||||
</program>
|
||||
<program>
|
||||
<mainClass>org.apache.solr.util.SuggestMissingFactories</mainClass>
|
||||
<name>SuggestMissingFactories</name>
|
||||
</program>
|
||||
</programs>
|
||||
</configuration>
|
||||
</plugin>
|
||||
<plugin>
|
||||
<groupId>org.codehaus.mojo</groupId>
|
||||
<artifactId>build-helper-maven-plugin</artifactId>
|
||||
|
|
|
@ -43,26 +43,14 @@
|
|||
<module-directory>solr</module-directory>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<issueManagement>
|
||||
<system>JIRA</system>
|
||||
<url>http://issues.apache.org/jira/browse/SOLR</url>
|
||||
<url>https://issues.apache.org/jira/browse/SOLR</url>
|
||||
</issueManagement>
|
||||
<ciManagement>
|
||||
<system>Hudson</system>
|
||||
<url>
|
||||
http://lucene.zones.apache.org:8080/hudson/job/Solr-Nightly/
|
||||
</url>
|
||||
</ciManagement>
|
||||
<mailingLists>
|
||||
<mailingList>
|
||||
<name>Solr User List</name>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<!-- These dependencies are compile scope because this is a test framework. -->
|
||||
|
@ -60,20 +54,27 @@
|
|||
<artifactId>solr-core</artifactId>
|
||||
<version>${project.version}</version>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>javax.servlet</groupId>
|
||||
<artifactId>servlet-api</artifactId>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>junit</groupId>
|
||||
<artifactId>junit</artifactId>
|
||||
</dependency>
|
||||
<!-- If your tests don't use BaseDistributedSearchTestCase or SolrJettyTestBase,
|
||||
you can exclude the three Jetty dependencies below. -->
|
||||
<dependency>
|
||||
<groupId>org.eclipse.jetty</groupId>
|
||||
<artifactId>jetty-server</artifactId>
|
||||
<scope>runtime</scope>
|
||||
<artifactId>jetty-servlet</artifactId>
|
||||
</dependency>
|
||||
<dependency>
|
||||
<groupId>org.eclipse.jetty</groupId>
|
||||
<artifactId>jetty-util</artifactId>
|
||||
</dependency>
|
||||
<!-- If your tests don't use BaseDistributedSearchTestCase or SolrJettyTestBase,
|
||||
you can exclude the two Jetty dependencies below. -->
|
||||
<dependency>
|
||||
<groupId>org.eclipse.jetty</groupId>
|
||||
<artifactId>jetty-server</artifactId>
|
||||
<scope>runtime</scope>
|
||||
</dependency>
|
||||
<dependency>
|
||||
|
|
|
@ -37,15 +37,9 @@
|
|||
<module-path>${top-level}/${module-directory}</module-path>
|
||||
</properties>
|
||||
<scm>
|
||||
<connection>
|
||||
scm:svn:http://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</connection>
|
||||
<developerConnection>
|
||||
scm:svn:https://svn.apache.org/repos/asf/lucene/dev/trunk/${module-directory}
|
||||
</developerConnection>
|
||||
<url>
|
||||
http://svn.apache.org/viewvc/lucene/dev/trunk/${module-directory}
|
||||
</url>
|
||||
<connection>scm:svn:${vc-anonymous-base-url}/${module-directory}</connection>
|
||||
<developerConnection>scm:svn:${vc-dev-base-url}/${module-directory}</developerConnection>
|
||||
<url>${vc-browse-base-url}/${module-directory}</url>
|
||||
</scm>
|
||||
<dependencies>
|
||||
<dependency>
|
||||
|
|
|
@ -23,7 +23,7 @@ reMarkup = re.compile('<.*?>')
|
|||
|
||||
def checkSummary(fullPath):
|
||||
printed = False
|
||||
f = open(fullPath)
|
||||
f = open(fullPath, encoding='UTF-8')
|
||||
anyMissing = False
|
||||
sawPackage = False
|
||||
desc = []
|
||||
|
@ -41,10 +41,10 @@ def checkSummary(fullPath):
|
|||
desc = desc.strip()
|
||||
if desc == '':
|
||||
if not printed:
|
||||
print
|
||||
print fullPath
|
||||
print()
|
||||
print(fullPath)
|
||||
printed = True
|
||||
print ' no package description (missing package.html in src?)'
|
||||
print(' no package description (missing package.html in src?)')
|
||||
anyMissing = True
|
||||
desc = None
|
||||
else:
|
||||
|
@ -52,17 +52,17 @@ def checkSummary(fullPath):
|
|||
|
||||
if lineLower in ('<td> </td>', '<td></td>', '<td class="collast"> </td>'):
|
||||
if not printed:
|
||||
print
|
||||
print fullPath
|
||||
print()
|
||||
print(fullPath)
|
||||
printed = True
|
||||
print ' missing: %s' % unescapeHTML(lastHREF)
|
||||
print(' missing: %s' % unescapeHTML(lastHREF))
|
||||
anyMissing = True
|
||||
elif lineLower.find('licensed to the apache software foundation') != -1 or lineLower.find('copyright 2004 the apache software foundation') != -1:
|
||||
if not printed:
|
||||
print
|
||||
print fullPath
|
||||
print()
|
||||
print(fullPath)
|
||||
printed = True
|
||||
print ' license-is-javadoc: %s' % unescapeHTML(lastHREF)
|
||||
print(' license-is-javadoc: %s' % unescapeHTML(lastHREF))
|
||||
anyMissing = True
|
||||
m = reHREF.search(line)
|
||||
if m is not None:
|
||||
|
@ -85,17 +85,17 @@ def checkPackageSummaries(root, level='class'):
|
|||
"""
|
||||
|
||||
if level != 'class' and level != 'package':
|
||||
print 'unsupported level: %s, must be "class" or "package"' % level
|
||||
print('unsupported level: %s, must be "class" or "package"' % level)
|
||||
sys.exit(1)
|
||||
|
||||
#for dirPath, dirNames, fileNames in os.walk('%s/lucene/build/docs/api' % root):
|
||||
|
||||
if False:
|
||||
os.chdir(root)
|
||||
print
|
||||
print 'Run "ant javadocs" > javadocs.log...'
|
||||
print()
|
||||
print('Run "ant javadocs" > javadocs.log...')
|
||||
if os.system('ant javadocs > javadocs.log 2>&1'):
|
||||
print ' FAILED'
|
||||
print(' FAILED')
|
||||
sys.exit(1)
|
||||
|
||||
anyMissing = False
|
||||
|
@ -116,14 +116,14 @@ def checkPackageSummaries(root, level='class'):
|
|||
|
||||
if __name__ == '__main__':
|
||||
if len(sys.argv) < 2 or len(sys.argv) > 3:
|
||||
print 'usage: %s <dir> [class|package]' % sys.argv[0]
|
||||
print('usage: %s <dir> [class|package]' % sys.argv[0])
|
||||
sys.exit(1)
|
||||
if len(sys.argv) == 2:
|
||||
level = 'class'
|
||||
else:
|
||||
level = sys.argv[2]
|
||||
if checkPackageSummaries(sys.argv[1], level):
|
||||
print
|
||||
print 'Missing javadocs were found!'
|
||||
print()
|
||||
print('Missing javadocs were found!')
|
||||
sys.exit(1)
|
||||
sys.exit(0)
|
||||
|
|
|
@ -20,12 +20,12 @@ import subprocess
|
|||
import signal
|
||||
import shutil
|
||||
import hashlib
|
||||
import httplib
|
||||
import http.client
|
||||
import re
|
||||
import urllib2
|
||||
import urlparse
|
||||
import urllib.request, urllib.error, urllib.parse
|
||||
import urllib.parse
|
||||
import sys
|
||||
import HTMLParser
|
||||
import html.parser
|
||||
from collections import defaultdict
|
||||
import xml.etree.ElementTree as ET
|
||||
import filecmp
|
||||
|
@ -38,9 +38,9 @@ import checkJavadocLinks
|
|||
# tested on Linux and on Cygwin under Windows 7.
|
||||
|
||||
def unshortenURL(url):
|
||||
parsed = urlparse.urlparse(url)
|
||||
parsed = urllib.parse.urlparse(url)
|
||||
if parsed[0] in ('http', 'https'):
|
||||
h = httplib.HTTPConnection(parsed.netloc)
|
||||
h = http.client.HTTPConnection(parsed.netloc)
|
||||
h.request('HEAD', parsed.path)
|
||||
response = h.getresponse()
|
||||
if response.status/100 == 3 and response.getheader('Location'):
|
||||
|
@ -101,8 +101,8 @@ def getHREFs(urlString):
|
|||
|
||||
# Deref any redirects
|
||||
while True:
|
||||
url = urlparse.urlparse(urlString)
|
||||
h = httplib.HTTPConnection(url.netloc)
|
||||
url = urllib.parse.urlparse(urlString)
|
||||
h = http.client.HTTPConnection(url.netloc)
|
||||
h.request('GET', url.path)
|
||||
r = h.getresponse()
|
||||
newLoc = r.getheader('location')
|
||||
|
@ -112,8 +112,8 @@ def getHREFs(urlString):
|
|||
break
|
||||
|
||||
links = []
|
||||
for subUrl, text in reHREF.findall(urllib2.urlopen(urlString).read()):
|
||||
fullURL = urlparse.urljoin(urlString, subUrl)
|
||||
for subUrl, text in reHREF.findall(urllib.request.urlopen(urlString).read().decode('UTF-8')):
|
||||
fullURL = urllib.parse.urljoin(urlString, subUrl)
|
||||
links.append((text, fullURL))
|
||||
return links
|
||||
|
||||
|
@ -121,15 +121,15 @@ def download(name, urlString, tmpDir, quiet=False):
|
|||
fileName = '%s/%s' % (tmpDir, name)
|
||||
if DEBUG and os.path.exists(fileName):
|
||||
if not quiet and fileName.find('.asc') == -1:
|
||||
print ' already done: %.1f MB' % (os.path.getsize(fileName)/1024./1024.)
|
||||
print(' already done: %.1f MB' % (os.path.getsize(fileName)/1024./1024.))
|
||||
return
|
||||
fIn = urllib2.urlopen(urlString)
|
||||
fIn = urllib.request.urlopen(urlString)
|
||||
fOut = open(fileName, 'wb')
|
||||
success = False
|
||||
try:
|
||||
while True:
|
||||
s = fIn.read(65536)
|
||||
if s == '':
|
||||
if s == b'':
|
||||
break
|
||||
fOut.write(s)
|
||||
fOut.close()
|
||||
|
@ -141,14 +141,14 @@ def download(name, urlString, tmpDir, quiet=False):
|
|||
if not success:
|
||||
os.remove(fileName)
|
||||
if not quiet and fileName.find('.asc') == -1:
|
||||
print ' %.1f MB' % (os.path.getsize(fileName)/1024./1024.)
|
||||
print(' %.1f MB' % (os.path.getsize(fileName)/1024./1024.))
|
||||
|
||||
def load(urlString):
|
||||
return urllib2.urlopen(urlString).read()
|
||||
return urllib.request.urlopen(urlString).read().decode('utf-8')
|
||||
|
||||
def checkSigs(project, urlString, version, tmpDir, isSigned):
|
||||
|
||||
print ' test basics...'
|
||||
print(' test basics...')
|
||||
ents = getDirEntries(urlString)
|
||||
artifact = None
|
||||
keysURL = None
|
||||
|
@ -210,7 +210,7 @@ def checkSigs(project, urlString, version, tmpDir, isSigned):
|
|||
if keysURL is None:
|
||||
raise RuntimeError('%s is missing KEYS' % project)
|
||||
|
||||
print ' get KEYS'
|
||||
print(' get KEYS')
|
||||
download('%s.KEYS' % project, keysURL, tmpDir)
|
||||
|
||||
keysFile = '%s/%s.KEYS' % (tmpDir, project)
|
||||
|
@ -219,7 +219,7 @@ def checkSigs(project, urlString, version, tmpDir, isSigned):
|
|||
gpgHomeDir = '%s/%s.gpg' % (tmpDir, project)
|
||||
if os.path.exists(gpgHomeDir):
|
||||
shutil.rmtree(gpgHomeDir)
|
||||
os.makedirs(gpgHomeDir, 0700)
|
||||
os.makedirs(gpgHomeDir, 0o700)
|
||||
run('gpg --homedir %s --import %s' % (gpgHomeDir, keysFile),
|
||||
'%s/%s.gpg.import.log 2>&1' % (tmpDir, project))
|
||||
|
||||
|
@ -232,12 +232,12 @@ def checkSigs(project, urlString, version, tmpDir, isSigned):
|
|||
testChanges(project, version, changesURL)
|
||||
|
||||
for artifact, urlString in artifacts:
|
||||
print ' download %s...' % artifact
|
||||
print(' download %s...' % artifact)
|
||||
download(artifact, urlString, tmpDir)
|
||||
verifyDigests(artifact, urlString, tmpDir)
|
||||
|
||||
if isSigned:
|
||||
print ' verify sig'
|
||||
print(' verify sig')
|
||||
# Test sig (this is done with a clean brand-new GPG world)
|
||||
download(artifact + '.asc', urlString + '.asc', tmpDir)
|
||||
sigFile = '%s/%s.asc' % (tmpDir, artifact)
|
||||
|
@ -246,28 +246,28 @@ def checkSigs(project, urlString, version, tmpDir, isSigned):
|
|||
run('gpg --homedir %s --verify %s %s' % (gpgHomeDir, sigFile, artifactFile),
|
||||
logFile)
|
||||
# Forward any GPG warnings, except the expected one (since its a clean world)
|
||||
f = open(logFile, 'rb')
|
||||
f = open(logFile, encoding='UTF-8')
|
||||
for line in f.readlines():
|
||||
if line.lower().find('warning') != -1 \
|
||||
and line.find('WARNING: This key is not certified with a trusted signature') == -1:
|
||||
print ' GPG: %s' % line.strip()
|
||||
print(' GPG: %s' % line.strip())
|
||||
f.close()
|
||||
|
||||
# Test trust (this is done with the real users config)
|
||||
run('gpg --import %s' % (keysFile),
|
||||
'%s/%s.gpg.trust.import.log 2>&1' % (tmpDir, project))
|
||||
print ' verify trust'
|
||||
print(' verify trust')
|
||||
logFile = '%s/%s.%s.gpg.trust.log' % (tmpDir, project, artifact)
|
||||
run('gpg --verify %s %s' % (sigFile, artifactFile), logFile)
|
||||
# Forward any GPG warnings:
|
||||
f = open(logFile, 'rb')
|
||||
f = open(logFile, encoding='UTF-8')
|
||||
for line in f.readlines():
|
||||
if line.lower().find('warning') != -1:
|
||||
print ' GPG: %s' % line.strip()
|
||||
print(' GPG: %s' % line.strip())
|
||||
f.close()
|
||||
|
||||
def testChanges(project, version, changesURLString):
|
||||
print ' check changes HTML...'
|
||||
print(' check changes HTML...')
|
||||
changesURL = None
|
||||
for text, subURL in getDirEntries(changesURLString):
|
||||
if text == 'Changes.html':
|
||||
|
@ -287,7 +287,7 @@ def testChangesText(dir, version, project):
|
|||
if 'CHANGES.txt' in files:
|
||||
fullPath = '%s/CHANGES.txt' % root
|
||||
#print 'CHECK %s' % fullPath
|
||||
checkChangesContent(open(fullPath).read(), version, fullPath, project, False)
|
||||
checkChangesContent(open(fullPath, encoding='UTF-8').read(), version, fullPath, project, False)
|
||||
|
||||
def checkChangesContent(s, version, name, project, isHTML):
|
||||
|
||||
|
@ -336,7 +336,7 @@ def run(command, logFile):
|
|||
raise RuntimeError('command "%s" failed; see log file %s' % (command, logPath))
|
||||
|
||||
def verifyDigests(artifact, urlString, tmpDir):
|
||||
print ' verify md5/sha1 digests'
|
||||
print(' verify md5/sha1 digests')
|
||||
md5Expected, t = load(urlString + '.md5').strip().split()
|
||||
if t != '*'+artifact:
|
||||
raise RuntimeError('MD5 %s.md5 lists artifact %s but expected *%s' % (urlString, t, artifact))
|
||||
|
@ -347,10 +347,10 @@ def verifyDigests(artifact, urlString, tmpDir):
|
|||
|
||||
m = hashlib.md5()
|
||||
s = hashlib.sha1()
|
||||
f = open('%s/%s' % (tmpDir, artifact))
|
||||
f = open('%s/%s' % (tmpDir, artifact), 'rb')
|
||||
while True:
|
||||
x = f.read(65536)
|
||||
if x == '':
|
||||
if len(x) == 0:
|
||||
break
|
||||
m.update(x)
|
||||
s.update(x)
|
||||
|
@ -363,6 +363,10 @@ def verifyDigests(artifact, urlString, tmpDir):
|
|||
raise RuntimeError('SHA1 digest mismatch for %s: expected %s but got %s' % (artifact, sha1Expected, sha1Actual))
|
||||
|
||||
def getDirEntries(urlString):
|
||||
if urlString.startswith('file:/') and not urlString.startswith('file://'):
|
||||
# stupid bogus ant URI
|
||||
urlString = "file:///" + urlString[6:]
|
||||
|
||||
if urlString.startswith('file://'):
|
||||
path = urlString[7:]
|
||||
if path.endswith('/'):
|
||||
|
@ -388,7 +392,7 @@ def unpack(project, tmpDir, artifact, version):
|
|||
shutil.rmtree(destDir)
|
||||
os.makedirs(destDir)
|
||||
os.chdir(destDir)
|
||||
print ' unpack %s...' % artifact
|
||||
print(' unpack %s...' % artifact)
|
||||
unpackLogFile = '%s/%s-unpack-%s.log' % (tmpDir, project, artifact)
|
||||
if artifact.endswith('.tar.gz') or artifact.endswith('.tgz'):
|
||||
run('tar xzf %s/%s' % (tmpDir, artifact), unpackLogFile)
|
||||
|
@ -437,12 +441,14 @@ def verifyUnpacked(project, artifact, unpackPath, version, tmpDir):
|
|||
|
||||
if project == 'lucene':
|
||||
# TODO: clean this up to not be a list of modules that we must maintain
|
||||
extras = ('analysis', 'benchmark', 'core', 'demo', 'docs', 'facet', 'grouping', 'highlighter', 'join', 'memory', 'misc', 'queries', 'queryparser', 'sandbox', 'spatial', 'suggest', 'test-framework')
|
||||
extras = ('analysis', 'benchmark', 'core', 'demo', 'docs', 'facet', 'grouping', 'highlighter', 'join', 'memory', 'misc', 'queries', 'queryparser', 'sandbox', 'spatial', 'suggest', 'test-framework', 'licenses')
|
||||
if isSrc:
|
||||
extras += ('build.xml', 'common-build.xml', 'module-build.xml', 'ivy-settings.xml', 'backwards', 'tools', 'site')
|
||||
else:
|
||||
extras = ()
|
||||
|
||||
# TODO: if solr, verify lucene/licenses, solr/licenses are present
|
||||
|
||||
for e in extras:
|
||||
if e not in l:
|
||||
raise RuntimeError('%s: %s missing from artifact %s' % (project, e, artifact))
|
||||
|
@ -453,81 +459,81 @@ def verifyUnpacked(project, artifact, unpackPath, version, tmpDir):
|
|||
raise RuntimeError('%s: unexpected files/dirs in artifact %s: %s' % (project, artifact, l))
|
||||
|
||||
if isSrc:
|
||||
print ' make sure no JARs/WARs in src dist...'
|
||||
print(' make sure no JARs/WARs in src dist...')
|
||||
lines = os.popen('find . -name \\*.jar').readlines()
|
||||
if len(lines) != 0:
|
||||
print ' FAILED:'
|
||||
print(' FAILED:')
|
||||
for line in lines:
|
||||
print ' %s' % line.strip()
|
||||
print(' %s' % line.strip())
|
||||
raise RuntimeError('source release has JARs...')
|
||||
lines = os.popen('find . -name \\*.war').readlines()
|
||||
if len(lines) != 0:
|
||||
print ' FAILED:'
|
||||
print(' FAILED:')
|
||||
for line in lines:
|
||||
print ' %s' % line.strip()
|
||||
print(' %s' % line.strip())
|
||||
raise RuntimeError('source release has WARs...')
|
||||
|
||||
print ' run "ant validate"'
|
||||
print(' run "ant validate"')
|
||||
run('%s; ant validate' % javaExe('1.7'), '%s/validate.log' % unpackPath)
|
||||
|
||||
if project == 'lucene':
|
||||
print ' run tests w/ Java 6...'
|
||||
print(' run tests w/ Java 6...')
|
||||
run('%s; ant test' % javaExe('1.6'), '%s/test.log' % unpackPath)
|
||||
run('%s; ant jar' % javaExe('1.6'), '%s/compile.log' % unpackPath)
|
||||
testDemo(isSrc, version)
|
||||
# test javadocs
|
||||
print ' generate javadocs w/ Java 6...'
|
||||
print(' generate javadocs w/ Java 6...')
|
||||
run('%s; ant javadocs' % javaExe('1.6'), '%s/javadocs.log' % unpackPath)
|
||||
checkJavadocpath('%s/build/docs' % unpackPath)
|
||||
else:
|
||||
print ' run tests w/ Java 6...'
|
||||
print(' run tests w/ Java 6...')
|
||||
run('%s; ant test' % javaExe('1.6'), '%s/test.log' % unpackPath)
|
||||
|
||||
# test javadocs
|
||||
print ' generate javadocs w/ Java 6...'
|
||||
print(' generate javadocs w/ Java 6...')
|
||||
run('%s; ant javadocs' % javaExe('1.6'), '%s/javadocs.log' % unpackPath)
|
||||
checkJavadocpath('%s/build/docs' % unpackPath)
|
||||
|
||||
print ' run tests w/ Java 7...'
|
||||
print(' run tests w/ Java 7...')
|
||||
run('%s; ant test' % javaExe('1.7'), '%s/test.log' % unpackPath)
|
||||
|
||||
# test javadocs
|
||||
print ' generate javadocs w/ Java 7...'
|
||||
print(' generate javadocs w/ Java 7...')
|
||||
run('%s; ant javadocs' % javaExe('1.7'), '%s/javadocs.log' % unpackPath)
|
||||
checkJavadocpath('%s/build/docs' % unpackPath)
|
||||
|
||||
os.chdir('solr')
|
||||
print ' test solr example w/ Java 6...'
|
||||
print(' test solr example w/ Java 6...')
|
||||
run('%s; ant clean example' % javaExe('1.6'), '%s/antexample.log' % unpackPath)
|
||||
testSolrExample(unpackPath, JAVA6_HOME, True)
|
||||
|
||||
print ' test solr example w/ Java 7...'
|
||||
print(' test solr example w/ Java 7...')
|
||||
run('%s; ant clean example' % javaExe('1.7'), '%s/antexample.log' % unpackPath)
|
||||
testSolrExample(unpackPath, JAVA7_HOME, True)
|
||||
os.chdir('..')
|
||||
|
||||
print ' check NOTICE'
|
||||
print(' check NOTICE')
|
||||
testNotice(unpackPath)
|
||||
|
||||
else:
|
||||
if project == 'lucene':
|
||||
testDemo(isSrc, version)
|
||||
else:
|
||||
print ' test solr example w/ Java 6...'
|
||||
print(' test solr example w/ Java 6...')
|
||||
testSolrExample(unpackPath, JAVA6_HOME, False)
|
||||
|
||||
print ' test solr example w/ Java 7...'
|
||||
print(' test solr example w/ Java 7...')
|
||||
testSolrExample(unpackPath, JAVA7_HOME, False)
|
||||
|
||||
testChangesText('.', version, project)
|
||||
|
||||
if project == 'lucene' and not isSrc:
|
||||
print ' check Lucene\'s javadoc JAR'
|
||||
print(' check Lucene\'s javadoc JAR')
|
||||
checkJavadocpath('%s/docs' % unpackPath)
|
||||
|
||||
def testNotice(unpackPath):
|
||||
solrNotice = open('%s/NOTICE.txt' % unpackPath).read()
|
||||
luceneNotice = open('%s/lucene/NOTICE.txt' % unpackPath).read()
|
||||
solrNotice = open('%s/NOTICE.txt' % unpackPath, encoding='UTF-8').read()
|
||||
luceneNotice = open('%s/lucene/NOTICE.txt' % unpackPath, encoding='UTF-8').read()
|
||||
|
||||
expected = """
|
||||
=========================================================================
|
||||
|
@ -545,12 +551,12 @@ def readSolrOutput(p, startupEvent, logFile):
|
|||
try:
|
||||
while True:
|
||||
line = p.readline()
|
||||
if line == '':
|
||||
if len(line) == 0:
|
||||
break
|
||||
f.write(line)
|
||||
f.flush()
|
||||
# print 'SOLR: %s' % line.strip()
|
||||
if line.find('Started SocketConnector@0.0.0.0:8983') != -1:
|
||||
if line.decode('UTF-8').find('Started SocketConnector@0.0.0.0:8983') != -1:
|
||||
startupEvent.set()
|
||||
finally:
|
||||
f.close()
|
||||
|
@ -558,7 +564,7 @@ def readSolrOutput(p, startupEvent, logFile):
|
|||
def testSolrExample(unpackPath, javaPath, isSrc):
|
||||
logFile = '%s/solr-example.log' % unpackPath
|
||||
os.chdir('example')
|
||||
print ' start Solr instance (log=%s)...' % logFile
|
||||
print(' start Solr instance (log=%s)...' % logFile)
|
||||
env = {}
|
||||
env.update(os.environ)
|
||||
env['JAVA_HOME'] = javaPath
|
||||
|
@ -572,21 +578,21 @@ def testSolrExample(unpackPath, javaPath, isSrc):
|
|||
|
||||
# Make sure Solr finishes startup:
|
||||
startupEvent.wait()
|
||||
print ' startup done'
|
||||
print(' startup done')
|
||||
|
||||
try:
|
||||
print ' test utf8...'
|
||||
print(' test utf8...')
|
||||
run('sh ./exampledocs/test_utf8.sh', 'utf8.log')
|
||||
print ' index example docs...'
|
||||
print(' index example docs...')
|
||||
run('sh ./exampledocs/post.sh ./exampledocs/*.xml', 'post-example-docs.log')
|
||||
print ' run query...'
|
||||
s = urllib2.urlopen('http://localhost:8983/solr/select/?q=video').read()
|
||||
print(' run query...')
|
||||
s = urllib.request.urlopen('http://localhost:8983/solr/select/?q=video').read().decode('UTF-8')
|
||||
if s.find('<result name="response" numFound="3" start="0">') == -1:
|
||||
print 'FAILED: response is:\n%s' % s
|
||||
print('FAILED: response is:\n%s' % s)
|
||||
raise RuntimeError('query on solr example instance failed')
|
||||
finally:
|
||||
# Stop server:
|
||||
print ' stop server (SIGINT)...'
|
||||
print(' stop server (SIGINT)...')
|
||||
os.kill(server.pid, signal.SIGINT)
|
||||
|
||||
# Give it 10 seconds to gracefully shut down
|
||||
|
@ -594,14 +600,14 @@ def testSolrExample(unpackPath, javaPath, isSrc):
|
|||
|
||||
if serverThread.isAlive():
|
||||
# Kill server:
|
||||
print '***WARNING***: Solr instance didn\'t respond to SIGINT; using SIGKILL now...'
|
||||
print('***WARNING***: Solr instance didn\'t respond to SIGINT; using SIGKILL now...')
|
||||
os.kill(server.pid, signal.SIGKILL)
|
||||
|
||||
serverThread.join(10.0)
|
||||
|
||||
if serverThread.isAlive():
|
||||
# Shouldn't happen unless something is seriously wrong...
|
||||
print '***WARNING***: Solr instance didn\'t respond to SIGKILL; ignoring...'
|
||||
print('***WARNING***: Solr instance didn\'t respond to SIGKILL; ignoring...')
|
||||
|
||||
os.chdir('..')
|
||||
|
||||
|
@ -615,13 +621,13 @@ def checkJavadocpath(path):
|
|||
if checkJavaDocs.checkPackageSummaries(path):
|
||||
# disabled: RM cannot fix all this, see LUCENE-3887
|
||||
# raise RuntimeError('javadoc problems')
|
||||
print '\n***WARNING***: javadocs want to fail!\n'
|
||||
print('\n***WARNING***: javadocs want to fail!\n')
|
||||
|
||||
if checkJavadocLinks.checkAll(path):
|
||||
raise RuntimeError('broken javadocs links found!')
|
||||
|
||||
def testDemo(isSrc, version):
|
||||
print ' test demo...'
|
||||
print(' test demo...')
|
||||
sep = ';' if cygwin else ':'
|
||||
if isSrc:
|
||||
cp = 'build/core/classes/java{0}build/demo/classes/java{0}build/analysis/common/classes/java{0}build/queryparser/classes/java'.format(sep)
|
||||
|
@ -632,14 +638,14 @@ def testDemo(isSrc, version):
|
|||
run('%s; java -cp "%s" org.apache.lucene.demo.IndexFiles -index index -docs %s' % (javaExe('1.6'), cp, docsDir), 'index.log')
|
||||
run('%s; java -cp "%s" org.apache.lucene.demo.SearchFiles -index index -query lucene' % (javaExe('1.6'), cp), 'search.log')
|
||||
reMatchingDocs = re.compile('(\d+) total matching documents')
|
||||
m = reMatchingDocs.search(open('search.log', 'rb').read())
|
||||
m = reMatchingDocs.search(open('search.log', encoding='UTF-8').read())
|
||||
if m is None:
|
||||
raise RuntimeError('lucene demo\'s SearchFiles found no results')
|
||||
else:
|
||||
numHits = int(m.group(1))
|
||||
if numHits < 100:
|
||||
raise RuntimeError('lucene demo\'s SearchFiles found too few results: %s' % numHits)
|
||||
print ' got %d hits for query "lucene"' % numHits
|
||||
print(' got %d hits for query "lucene"' % numHits)
|
||||
|
||||
def checkMaven(baseURL, tmpDir, version, isSigned):
|
||||
# Locate the release branch in subversion
|
||||
|
@ -652,11 +658,11 @@ def checkMaven(baseURL, tmpDir, version, isSigned):
|
|||
if text == releaseBranchText:
|
||||
releaseBranchSvnURL = subURL
|
||||
|
||||
print ' get POM templates',
|
||||
print(' get POM templates', end=' ')
|
||||
POMtemplates = defaultdict()
|
||||
getPOMtemplates(POMtemplates, tmpDir, releaseBranchSvnURL)
|
||||
print
|
||||
print ' download artifacts',
|
||||
print()
|
||||
print(' download artifacts', end=' ')
|
||||
artifacts = {'lucene': [], 'solr': []}
|
||||
for project in ('lucene', 'solr'):
|
||||
artifactsURL = '%s/%s/maven/org/apache/%s' % (baseURL, project, project)
|
||||
|
@ -664,30 +670,30 @@ def checkMaven(baseURL, tmpDir, version, isSigned):
|
|||
if not os.path.exists(targetDir):
|
||||
os.makedirs(targetDir)
|
||||
crawl(artifacts[project], artifactsURL, targetDir)
|
||||
print
|
||||
print ' verify that each binary artifact has a deployed POM...'
|
||||
print()
|
||||
print(' verify that each binary artifact has a deployed POM...')
|
||||
verifyPOMperBinaryArtifact(artifacts, version)
|
||||
print ' verify that there is an artifact for each POM template...'
|
||||
print(' verify that there is an artifact for each POM template...')
|
||||
verifyArtifactPerPOMtemplate(POMtemplates, artifacts, tmpDir, version)
|
||||
print " verify Maven artifacts' md5/sha1 digests..."
|
||||
print(" verify Maven artifacts' md5/sha1 digests...")
|
||||
verifyMavenDigests(artifacts)
|
||||
print ' verify that all non-Mavenized deps are deployed...'
|
||||
print(' verify that all non-Mavenized deps are deployed...')
|
||||
nonMavenizedDeps = dict()
|
||||
checkNonMavenizedDeps(nonMavenizedDeps, POMtemplates, artifacts, tmpDir,
|
||||
version, releaseBranchSvnURL)
|
||||
print ' check for javadoc and sources artifacts...'
|
||||
print(' check for javadoc and sources artifacts...')
|
||||
checkJavadocAndSourceArtifacts(nonMavenizedDeps, artifacts, version)
|
||||
print " verify deployed POMs' coordinates..."
|
||||
print(" verify deployed POMs' coordinates...")
|
||||
verifyDeployedPOMsCoordinates(artifacts, version)
|
||||
if isSigned:
|
||||
print ' verify maven artifact sigs',
|
||||
print(' verify maven artifact sigs', end=' ')
|
||||
verifyMavenSigs(baseURL, tmpDir, artifacts)
|
||||
|
||||
distributionFiles = getDistributionsForMavenChecks(tmpDir, version, baseURL)
|
||||
|
||||
print ' verify that non-Mavenized deps are same as in the binary distribution...'
|
||||
print(' verify that non-Mavenized deps are same as in the binary distribution...')
|
||||
checkIdenticalNonMavenizedDeps(distributionFiles, nonMavenizedDeps)
|
||||
print ' verify that Maven artifacts are same as in the binary distribution...'
|
||||
print(' verify that Maven artifacts are same as in the binary distribution...')
|
||||
checkIdenticalMavenArtifacts(distributionFiles, nonMavenizedDeps, artifacts, version)
|
||||
|
||||
def getDistributionsForMavenChecks(tmpDir, version, baseURL):
|
||||
|
@ -697,19 +703,19 @@ def getDistributionsForMavenChecks(tmpDir, version, baseURL):
|
|||
if project == 'solr': distribution = 'apache-' + distribution
|
||||
if not os.path.exists('%s/%s' % (tmpDir, distribution)):
|
||||
distURL = '%s/%s/%s' % (baseURL, project, distribution)
|
||||
print ' download %s...' % distribution,
|
||||
print(' download %s...' % distribution, end=' ')
|
||||
download(distribution, distURL, tmpDir)
|
||||
destDir = '%s/unpack-%s-maven' % (tmpDir, project)
|
||||
if os.path.exists(destDir):
|
||||
shutil.rmtree(destDir)
|
||||
os.makedirs(destDir)
|
||||
os.chdir(destDir)
|
||||
print ' unpack %s...' % distribution
|
||||
print(' unpack %s...' % distribution)
|
||||
unpackLogFile = '%s/unpack-%s-maven-checks.log' % (tmpDir, distribution)
|
||||
run('tar xzf %s/%s' % (tmpDir, distribution), unpackLogFile)
|
||||
if project == 'solr': # unpack the Solr war
|
||||
unpackLogFile = '%s/unpack-solr-war-maven-checks.log' % tmpDir
|
||||
print ' unpack Solr war...'
|
||||
print(' unpack Solr war...')
|
||||
run('jar xvf */dist/*.war', unpackLogFile)
|
||||
distributionFiles[project] = []
|
||||
for root, dirs, files in os.walk(destDir):
|
||||
|
@ -719,7 +725,7 @@ def getDistributionsForMavenChecks(tmpDir, version, baseURL):
|
|||
def checkJavadocAndSourceArtifacts(nonMavenizedDeps, artifacts, version):
|
||||
for project in ('lucene', 'solr'):
|
||||
for artifact in artifacts[project]:
|
||||
if artifact.endswith(version + '.jar') and artifact not in nonMavenizedDeps.keys():
|
||||
if artifact.endswith(version + '.jar') and artifact not in list(nonMavenizedDeps.keys()):
|
||||
javadocJar = artifact[:-4] + '-javadoc.jar'
|
||||
if javadocJar not in artifacts[project]:
|
||||
raise RuntimeError('missing: %s' % javadocJar)
|
||||
|
@ -732,7 +738,7 @@ def checkIdenticalNonMavenizedDeps(distributionFiles, nonMavenizedDeps):
|
|||
distFilenames = dict()
|
||||
for file in distributionFiles[project]:
|
||||
distFilenames[os.path.basename(file)] = file
|
||||
for dep in nonMavenizedDeps.keys():
|
||||
for dep in list(nonMavenizedDeps.keys()):
|
||||
if ('/%s/' % project) in dep:
|
||||
depOrigFilename = os.path.basename(nonMavenizedDeps[dep])
|
||||
if not depOrigFilename in distFilenames:
|
||||
|
@ -753,9 +759,9 @@ def checkIdenticalMavenArtifacts(distributionFiles, nonMavenizedDeps, artifacts,
|
|||
distFilenames[baseName] = file
|
||||
for artifact in artifacts[project]:
|
||||
if reJarWar.search(artifact):
|
||||
if artifact not in nonMavenizedDeps.keys():
|
||||
if artifact not in list(nonMavenizedDeps.keys()):
|
||||
artifactFilename = os.path.basename(artifact)
|
||||
if artifactFilename not in distFilenames.keys():
|
||||
if artifactFilename not in list(distFilenames.keys()):
|
||||
raise RuntimeError('Maven artifact %s is not present in %s binary distribution'
|
||||
% (artifact, project))
|
||||
# TODO: Either fix the build to ensure that maven artifacts *are* identical, or recursively compare contents
|
||||
|
@ -772,16 +778,17 @@ def verifyMavenDigests(artifacts):
|
|||
raise RuntimeError('missing: MD5 digest for %s' % artifactFile)
|
||||
if artifactFile + '.sha1' not in artifacts[project]:
|
||||
raise RuntimeError('missing: SHA1 digest for %s' % artifactFile)
|
||||
with open(artifactFile + '.md5', 'r') as md5File:
|
||||
with open(artifactFile + '.md5', encoding='UTF-8') as md5File:
|
||||
md5Expected = md5File.read().strip()
|
||||
with open(artifactFile + '.sha1', 'r') as sha1File:
|
||||
with open(artifactFile + '.sha1', encoding='UTF-8') as sha1File:
|
||||
sha1Expected = sha1File.read().strip()
|
||||
md5 = hashlib.md5()
|
||||
sha1 = hashlib.sha1()
|
||||
inputFile = open(artifactFile)
|
||||
inputFile = open(artifactFile, 'rb')
|
||||
while True:
|
||||
bytes = inputFile.read(65536)
|
||||
if bytes == '': break
|
||||
if len(bytes) == 0:
|
||||
break
|
||||
md5.update(bytes)
|
||||
sha1.update(bytes)
|
||||
inputFile.close()
|
||||
|
@ -846,7 +853,7 @@ def checkNonMavenizedDeps(nonMavenizedDependencies, POMtemplates, artifacts,
|
|||
if releaseBranchSvnURL is None:
|
||||
pomPath = '%s/%s/%s' % (workingCopy, pomDir, pomFile)
|
||||
if os.path.exists(pomPath):
|
||||
doc2 = ET.XML(open(pomPath).read())
|
||||
doc2 = ET.XML(open(pomPath, encoding='UTF-8').read())
|
||||
break
|
||||
else:
|
||||
entries = getDirEntries('%s/%s' % (releaseBranchSvnURL, pomDir))
|
||||
|
@ -891,7 +898,7 @@ def verifyMavenSigs(baseURL, tmpDir, artifacts):
|
|||
gpgHomeDir = '%s/%s.gpg' % (tmpDir, project)
|
||||
if os.path.exists(gpgHomeDir):
|
||||
shutil.rmtree(gpgHomeDir)
|
||||
os.makedirs(gpgHomeDir, 0700)
|
||||
os.makedirs(gpgHomeDir, 0o700)
|
||||
run('gpg --homedir %s --import %s' % (gpgHomeDir, keysFile),
|
||||
'%s/%s.gpg.import.log' % (tmpDir, project))
|
||||
|
||||
|
@ -904,12 +911,12 @@ def verifyMavenSigs(baseURL, tmpDir, artifacts):
|
|||
run('gpg --homedir %s --verify %s %s' % (gpgHomeDir, sigFile, artifactFile),
|
||||
logFile)
|
||||
# Forward any GPG warnings, except the expected one (since its a clean world)
|
||||
f = open(logFile, 'rb')
|
||||
f = open(logFile, encoding='UTF-8')
|
||||
for line in f.readlines():
|
||||
if line.lower().find('warning') != -1 \
|
||||
and line.find('WARNING: This key is not certified with a trusted signature') == -1 \
|
||||
and line.find('WARNING: using insecure memory') == -1:
|
||||
print ' GPG: %s' % line.strip()
|
||||
print(' GPG: %s' % line.strip())
|
||||
f.close()
|
||||
|
||||
# Test trust (this is done with the real users config)
|
||||
|
@ -918,16 +925,16 @@ def verifyMavenSigs(baseURL, tmpDir, artifacts):
|
|||
logFile = '%s/%s.%s.gpg.trust.log' % (tmpDir, project, artifact)
|
||||
run('gpg --verify %s %s' % (sigFile, artifactFile), logFile)
|
||||
# Forward any GPG warnings:
|
||||
f = open(logFile, 'rb')
|
||||
f = open(logFile, encoding='UTF-8')
|
||||
for line in f.readlines():
|
||||
if line.lower().find('warning') != -1 \
|
||||
and line.find('WARNING: This key is not certified with a trusted signature') == -1 \
|
||||
and line.find('WARNING: using insecure memory') == -1:
|
||||
print ' GPG: %s' % line.strip()
|
||||
print(' GPG: %s' % line.strip())
|
||||
f.close()
|
||||
|
||||
sys.stdout.write('.')
|
||||
print
|
||||
print()
|
||||
|
||||
def verifyPOMperBinaryArtifact(artifacts, version):
|
||||
"""verify that each binary jar and war has a corresponding POM file"""
|
||||
|
@ -1023,17 +1030,20 @@ def crawl(downloadedFiles, urlString, targetDir, exclusions=set()):
|
|||
|
||||
def main():
|
||||
|
||||
if len(sys.argv) != 4:
|
||||
print
|
||||
print 'Usage python -u %s BaseURL version tmpDir' % sys.argv[0]
|
||||
print
|
||||
if len(sys.argv) < 4:
|
||||
print()
|
||||
print('Usage python -u %s BaseURL version tmpDir' % sys.argv[0])
|
||||
print()
|
||||
sys.exit(1)
|
||||
|
||||
baseURL = sys.argv[1]
|
||||
version = sys.argv[2]
|
||||
tmpDir = os.path.abspath(sys.argv[3])
|
||||
isSigned = True
|
||||
if len(sys.argv) == 5:
|
||||
isSigned = (sys.argv[4] == "True")
|
||||
|
||||
smokeTest(baseURL, version, tmpDir, True)
|
||||
smokeTest(baseURL, version, tmpDir, isSigned)
|
||||
|
||||
def smokeTest(baseURL, version, tmpDir, isSigned):
|
||||
|
||||
|
@ -1046,11 +1056,11 @@ def smokeTest(baseURL, version, tmpDir, isSigned):
|
|||
|
||||
lucenePath = None
|
||||
solrPath = None
|
||||
print
|
||||
print 'Load release URL "%s"...' % baseURL
|
||||
print()
|
||||
print('Load release URL "%s"...' % baseURL)
|
||||
newBaseURL = unshortenURL(baseURL)
|
||||
if newBaseURL != baseURL:
|
||||
print ' unshortened: %s' % newBaseURL
|
||||
print(' unshortened: %s' % newBaseURL)
|
||||
baseURL = newBaseURL
|
||||
|
||||
for text, subURL in getDirEntries(baseURL):
|
||||
|
@ -1064,23 +1074,28 @@ def smokeTest(baseURL, version, tmpDir, isSigned):
|
|||
if solrPath is None:
|
||||
raise RuntimeError('could not find solr subdir')
|
||||
|
||||
print
|
||||
print 'Test Lucene...'
|
||||
print()
|
||||
print('Test Lucene...')
|
||||
checkSigs('lucene', lucenePath, version, tmpDir, isSigned)
|
||||
for artifact in ('lucene-%s.tgz' % version, 'lucene-%s.zip' % version):
|
||||
unpack('lucene', tmpDir, artifact, version)
|
||||
unpack('lucene', tmpDir, 'lucene-%s-src.tgz' % version, version)
|
||||
|
||||
print
|
||||
print 'Test Solr...'
|
||||
print()
|
||||
print('Test Solr...')
|
||||
checkSigs('solr', solrPath, version, tmpDir, isSigned)
|
||||
for artifact in ('apache-solr-%s.tgz' % version, 'apache-solr-%s.zip' % version):
|
||||
unpack('solr', tmpDir, artifact, version)
|
||||
unpack('solr', tmpDir, 'apache-solr-%s-src.tgz' % version, version)
|
||||
|
||||
print 'Test Maven artifacts for Lucene and Solr...'
|
||||
print('Test Maven artifacts for Lucene and Solr...')
|
||||
checkMaven(baseURL, tmpDir, version, isSigned)
|
||||
|
||||
if __name__ == '__main__':
|
||||
try:
|
||||
main()
|
||||
|
||||
except:
|
||||
import traceback
|
||||
traceback.print_exc()
|
||||
sys.exit(1)
|
||||
sys.exit(0)
|
||||
|
|
|
@ -6,6 +6,15 @@ http://s.apache.org/luceneversions
|
|||
|
||||
======================= Lucene 5.0.0 =======================
|
||||
|
||||
======================= Lucene 4.0.0 =======================
|
||||
|
||||
Bug Fixes
|
||||
|
||||
* LUCENE-4297: BooleanScorer2 would multiply the coord() factor
|
||||
twice for conjunctions: for most users this is no problem, but
|
||||
if you had a customized Similarity that returned something other
|
||||
than 1 when overlap == maxOverlap (always the case for conjunctions),
|
||||
then the score would be incorrect. (Pascal Chollet, Robert Muir)
|
||||
|
||||
======================= Lucene 4.0.0-BETA =======================
|
||||
|
||||
|
@ -15,6 +24,9 @@ New features
|
|||
underlying PayloadFunction's explanation as the explanation
|
||||
for the payload score. (Scott Smerchek via Robert Muir)
|
||||
|
||||
* LUCENE-4069: Added BloomFilteringPostingsFormat for use with low-frequency terms
|
||||
such as primary keys (Mark Harwood, Mike McCandless)
|
||||
|
||||
* LUCENE-4201: Added JapaneseIterationMarkCharFilter to normalize Japanese
|
||||
iteration marks. (Robert Muir, Christian Moen)
|
||||
|
||||
|
@ -34,6 +46,22 @@ New features
|
|||
CharFilterFactories to the lucene-analysis module. The API is still
|
||||
experimental. (Chris Male, Robert Muir, Uwe Schindler)
|
||||
|
||||
* LUCENE-4230: When pulling a DocsAndPositionsEnum you can now
|
||||
specify whether or not you require payloads (in addition to
|
||||
offsets); turning one or both off may allow some codec
|
||||
implementations to optimize the enum implementation. (Robert Muir,
|
||||
Mike McCandless)
|
||||
|
||||
* LUCENE-4203: Add IndexWriter.tryDeleteDocument(AtomicReader reader,
|
||||
int docID), to attempt deletion by docID as long as the provided
|
||||
reader is an NRT reader, and the segment has not yet been merged
|
||||
away (Mike McCandless).
|
||||
|
||||
* LUCENE-4286: Added option to CJKBigramFilter to always also output
|
||||
unigrams. This can be used for a unigram+bigram approach, or at
|
||||
index-time only for better support of short queries.
|
||||
(Tom Burton-West, Robert Muir)
|
||||
|
||||
API Changes
|
||||
|
||||
* LUCENE-4138: update of morfologik (Polish morphological analyzer) to 1.5.3.
|
||||
|
@ -69,6 +97,23 @@ API Changes
|
|||
|
||||
* LUCENE-3747: Support Unicode 6.1.0. (Steve Rowe)
|
||||
|
||||
* LUCENE-3884: Moved ElisionFilter out of org.apache.lucene.analysis.fr
|
||||
package into org.apache.lucene.analysis.util. (Robert Muir)
|
||||
|
||||
* LUCENE-4230: When pulling a DocsAndPositionsEnum you now pass an int
|
||||
flags instead of the previous boolean needOffsets. Currently
|
||||
recognized flags are DocsAndPositionsEnum.FLAG_PAYLOADS and
|
||||
DocsAndPositionsEnum.FLAG_OFFSETS (Robert Muir, Mike McCandless)
|
||||
|
||||
* LUCENE-4273: When pulling a DocsEnum, you can pass an int flags
|
||||
instead of the previous boolean needsFreqs; consistent with the changes
|
||||
for DocsAndPositionsEnum in LUCENE-4230. Currently the only flag
|
||||
is DocsEnum.FLAG_FREQS. (Robert Muir, Mike McCandless)
|
||||
|
||||
* LUCENE-3616: TextField(String, Reader, Store) was reduced to TextField(String, Reader),
|
||||
as the Store parameter didn't make sense: if you supplied Store.YES, you would only
|
||||
receive an exception anyway. (Robert Muir)
|
||||
|
||||
Optimizations
|
||||
|
||||
* LUCENE-4171: Performance improvements to Packed64.
|
||||
|
@ -80,8 +125,19 @@ Optimizations
|
|||
* LUCENE-4235: Remove enforcing of Filter rewrite for NRQ queries.
|
||||
(Uwe Schindler)
|
||||
|
||||
* LUCENE-4279: Regenerated snowball Stemmers from snowball r554,
|
||||
making them substantially more lightweight. Behavior is unchanged.
|
||||
(Robert Muir)
|
||||
|
||||
* LUCENE-4291: Reduced internal buffer size for Jflex-based tokenizers
|
||||
such as StandardTokenizer from 32kb to 8kb.
|
||||
(Raintung Li, Steven Rowe, Robert Muir)
|
||||
|
||||
Bug Fixes
|
||||
|
||||
* LUCENE-4109: BooleanQueries are not parsed correctly with the
|
||||
flexible query parser. (Karsten Rauch via Robert Muir)
|
||||
|
||||
* LUCENE-4176: Fix AnalyzingQueryParser to analyze range endpoints as bytes,
|
||||
so that it works correctly with Analyzers that produce binary non-UTF-8 terms
|
||||
such as CollationAnalyzer. (Nattapong Sirilappanich via Robert Muir)
|
||||
|
@ -113,6 +169,30 @@ Bug Fixes
|
|||
* LUCENE-4245: Make IndexWriter#close() and MergeScheduler#close()
|
||||
non-interruptible. (Mark Miller, Uwe Schindler)
|
||||
|
||||
* LUCENE-4190: restrict allowed filenames that a codec may create to
|
||||
the patterns recognized by IndexFileNames. This also fixes
|
||||
IndexWriter to only delete files matching this pattern from an index
|
||||
directory, to reduce risk when the wrong index path is accidentally
|
||||
passed to IndexWriter (Robert Muir, Mike McCandless)
|
||||
|
||||
* LUCENE-4277: Fix IndexWriter deadlock during rollback if flushable DWPT
|
||||
instances are already checked out and queued up but not yet flushed.
|
||||
(Simon Willnauer)
|
||||
|
||||
* LUCENE-4282: Automaton FuzzyQuery didn't always deliver all results.
|
||||
(Johannes Christen, Uwe Schindler, Robert Muir)
|
||||
|
||||
* LUCENE-4289: Fix minor idf inconsistencies/inefficiencies in highlighter.
|
||||
(Robert Muir)
|
||||
|
||||
Changes in Runtime Behavior
|
||||
|
||||
* LUCENE-4109: Enable position increments in the flexible queryparser by default.
|
||||
(Karsten Rauch via Robert Muir)
|
||||
|
||||
* LUCENE-3616: Field throws exception if you try to set a boost on an
|
||||
unindexed field or one that omits norms. (Robert Muir)
|
||||
|
||||
Build
|
||||
|
||||
* LUCENE-4094: Support overriding file.encoding on forked test JVMs
|
||||
|
|
|
@ -57,30 +57,6 @@ enumeration APIs. Here are the major changes:
|
|||
...
|
||||
}
|
||||
|
||||
The bulk read API has also changed. Instead of this:
|
||||
|
||||
int[] docs = new int[256];
|
||||
int[] freqs = new int[256];
|
||||
|
||||
while(true) {
|
||||
int count = td.read(docs, freqs)
|
||||
if (count == 0) {
|
||||
break;
|
||||
}
|
||||
// use docs[i], freqs[i]
|
||||
}
|
||||
|
||||
do this:
|
||||
|
||||
DocsEnum.BulkReadResult bulk = td.getBulkResult();
|
||||
while(true) {
|
||||
int count = td.read();
|
||||
if (count == 0) {
|
||||
break;
|
||||
}
|
||||
// use bulk.docs.ints[i] and bulk.freqs.ints[i]
|
||||
}
|
||||
|
||||
* TermPositions is renamed to DocsAndPositionsEnum, and no longer
|
||||
extends the docs only enumerator (DocsEnum).
|
||||
|
||||
|
@ -170,7 +146,7 @@ enumeration APIs. Here are the major changes:
|
|||
Bits liveDocs = reader.getLiveDocs();
|
||||
DocsEnum docsEnum = null;
|
||||
|
||||
docsEnum = termsEnum.docs(liveDocs, docsEnum);
|
||||
docsEnum = termsEnum.docs(liveDocs, docsEnum, needsFreqs);
|
||||
|
||||
You can pass in a prior DocsEnum and it will be reused if possible.
|
||||
|
||||
|
@ -187,7 +163,7 @@ enumeration APIs. Here are the major changes:
|
|||
|
||||
String field;
|
||||
BytesRef text;
|
||||
DocsEnum docsEnum = reader.termDocsEnum(reader.getLiveDocs(), field, text);
|
||||
DocsEnum docsEnum = reader.termDocsEnum(reader.getLiveDocs(), field, text, needsFreqs);
|
||||
|
||||
Likewise for DocsAndPositionsEnum.
|
||||
|
||||
|
@ -340,11 +316,12 @@ an AtomicReader. Note: using "atomicity emulators" can cause serious
|
|||
slowdowns due to the need to merge terms, postings, DocValues, and
|
||||
FieldCache, use them with care!
|
||||
|
||||
## LUCENE-2413: Analyzer package changes
|
||||
## LUCENE-2413,LUCENE-3396: Analyzer package changes
|
||||
|
||||
Lucene's core and contrib analyzers, along with Solr's analyzers,
|
||||
were consolidated into lucene/analysis. During the refactoring some
|
||||
package names have changed:
|
||||
package names have changed, and ReusableAnalyzerBase was renamed to
|
||||
Analyzer:
|
||||
|
||||
- o.a.l.analysis.KeywordAnalyzer -> o.a.l.analysis.core.KeywordAnalyzer
|
||||
- o.a.l.analysis.KeywordTokenizer -> o.a.l.analysis.core.KeywordTokenizer
|
||||
|
@ -369,7 +346,7 @@ package names have changed:
|
|||
- o.a.l.analysis.NormalizeCharMap -> o.a.l.analysis.charfilter.NormalizeCharMap
|
||||
- o.a.l.analysis.CharArraySet -> o.a.l.analysis.util.CharArraySet
|
||||
- o.a.l.analysis.CharArrayMap -> o.a.l.analysis.util.CharArrayMap
|
||||
- o.a.l.analysis.ReusableAnalyzerBase -> o.a.l.analysis.util.ReusableAnalyzerBase
|
||||
- o.a.l.analysis.ReusableAnalyzerBase -> o.a.l.analysis.Analyzer
|
||||
- o.a.l.analysis.StopwordAnalyzerBase -> o.a.l.analysis.util.StopwordAnalyzerBase
|
||||
- o.a.l.analysis.WordListLoader -> o.a.l.analysis.util.WordListLoader
|
||||
- o.a.l.analysis.CharTokenizer -> o.a.l.analysis.util.CharTokenizer
|
||||
|
|
|
@ -24,7 +24,6 @@ import java.util.Arrays;
|
|||
import org.apache.lucene.analysis.Analyzer;
|
||||
import org.apache.lucene.analysis.core.LowerCaseFilter;
|
||||
import org.apache.lucene.analysis.core.StopFilter;
|
||||
import org.apache.lucene.analysis.fr.ElisionFilter;
|
||||
import org.apache.lucene.analysis.miscellaneous.KeywordMarkerFilter;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.Tokenizer;
|
||||
|
@ -32,6 +31,7 @@ import org.apache.lucene.analysis.snowball.SnowballFilter;
|
|||
import org.apache.lucene.analysis.standard.StandardFilter;
|
||||
import org.apache.lucene.analysis.standard.StandardTokenizer;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ElisionFilter;
|
||||
import org.apache.lucene.analysis.util.StopwordAnalyzerBase;
|
||||
import org.apache.lucene.util.Version;
|
||||
import org.tartarus.snowball.ext.CatalanStemmer;
|
||||
|
@ -127,7 +127,7 @@ public final class CatalanAnalyzer extends StopwordAnalyzerBase {
|
|||
Reader reader) {
|
||||
final Tokenizer source = new StandardTokenizer(matchVersion, reader);
|
||||
TokenStream result = new StandardFilter(matchVersion, source);
|
||||
result = new ElisionFilter(matchVersion, result, DEFAULT_ARTICLES);
|
||||
result = new ElisionFilter(result, DEFAULT_ARTICLES);
|
||||
result = new LowerCaseFilter(matchVersion, result);
|
||||
result = new StopFilter(matchVersion, result, stopwords);
|
||||
if(!stemExclusionSet.isEmpty())
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 7/26/12 6:22 PM */
|
||||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 8/6/12 11:57 AM */
|
||||
|
||||
package org.apache.lucene.analysis.charfilter;
|
||||
|
||||
|
@ -40,8 +40,8 @@ import org.apache.lucene.analysis.util.OpenStringBuilder;
|
|||
/**
|
||||
* This class is a scanner generated by
|
||||
* <a href="http://www.jflex.de/">JFlex</a> 1.5.0-SNAPSHOT
|
||||
* on 7/26/12 6:22 PM from the specification file
|
||||
* <tt>C:/svn/lucene/dev/trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex</tt>
|
||||
* on 8/6/12 11:57 AM from the specification file
|
||||
* <tt>/home/rmuir/workspace/lucene-trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.jflex</tt>
|
||||
*/
|
||||
public final class HTMLStripCharFilter extends BaseCharFilter {
|
||||
|
||||
|
@ -31255,6 +31255,93 @@ public final class HTMLStripCharFilter extends BaseCharFilter {
|
|||
{ yybegin(STYLE);
|
||||
}
|
||||
case 55: break;
|
||||
case 27:
|
||||
{ // add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 1;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 1, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return BLOCK_LEVEL_START_TAG_REPLACEMENT;
|
||||
}
|
||||
case 56: break;
|
||||
case 30:
|
||||
{ int length = yylength();
|
||||
inputSegment.write(zzBuffer, zzStartRead, length);
|
||||
entitySegment.clear();
|
||||
char ch = entityValues.get(zzBuffer, zzStartRead, length).charValue();
|
||||
entitySegment.append(ch);
|
||||
outputSegment = entitySegment;
|
||||
yybegin(CHARACTER_REFERENCE_TAIL);
|
||||
}
|
||||
case 57: break;
|
||||
case 48:
|
||||
{ inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
// add (previously matched input length) -- current match and substitution handled below
|
||||
cumulativeDiff += yychar - inputStart;
|
||||
// position the offset correction at (already output length) -- substitution handled below
|
||||
int offsetCorrectionPos = outputCharCount;
|
||||
int returnValue;
|
||||
if (escapeSTYLE) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
returnValue = outputSegment.nextChar();
|
||||
} else {
|
||||
// add (this match length) - (substitution length)
|
||||
cumulativeDiff += yylength() - 1;
|
||||
// add (substitution length)
|
||||
++offsetCorrectionPos;
|
||||
returnValue = STYLE_REPLACEMENT;
|
||||
}
|
||||
addOffCorrectMap(offsetCorrectionPos, cumulativeDiff);
|
||||
return returnValue;
|
||||
}
|
||||
case 58: break;
|
||||
case 8:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(START_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(START_TAG_TAIL_SUBSTITUTE);
|
||||
}
|
||||
}
|
||||
case 59: break;
|
||||
case 2:
|
||||
{ inputStart = yychar;
|
||||
inputSegment.clear();
|
||||
inputSegment.append('<');
|
||||
yybegin(LEFT_ANGLE_BRACKET);
|
||||
}
|
||||
case 60: break;
|
||||
case 44:
|
||||
{ restoreState = STYLE_COMMENT; yybegin(SERVER_SIDE_INCLUDE);
|
||||
}
|
||||
case 61: break;
|
||||
case 21:
|
||||
{ previousRestoreState = restoreState;
|
||||
restoreState = SERVER_SIDE_INCLUDE;
|
||||
yybegin(SINGLE_QUOTED_STRING);
|
||||
}
|
||||
case 62: break;
|
||||
case 11:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
yybegin(LEFT_ANGLE_BRACKET_SPACE);
|
||||
}
|
||||
case 63: break;
|
||||
case 35:
|
||||
{ yybegin(SCRIPT);
|
||||
}
|
||||
case 64: break;
|
||||
case 42:
|
||||
{ restoreState = COMMENT; yybegin(SERVER_SIDE_INCLUDE);
|
||||
}
|
||||
case 65: break;
|
||||
case 10:
|
||||
{ inputSegment.append('!'); yybegin(BANG);
|
||||
}
|
||||
case 66: break;
|
||||
case 51:
|
||||
{ // Handle paired UTF-16 surrogates.
|
||||
String surrogatePair = yytext();
|
||||
|
@ -31288,13 +31375,331 @@ public final class HTMLStripCharFilter extends BaseCharFilter {
|
|||
inputSegment.append('#');
|
||||
yybegin(NUMERIC_CHARACTER);
|
||||
}
|
||||
case 56: break;
|
||||
case 21:
|
||||
case 67: break;
|
||||
case 4:
|
||||
{ yypushback(1);
|
||||
outputSegment = inputSegment;
|
||||
outputSegment.restart();
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
case 68: break;
|
||||
case 43:
|
||||
{ restoreState = SCRIPT_COMMENT; yybegin(SERVER_SIDE_INCLUDE);
|
||||
}
|
||||
case 69: break;
|
||||
case 52:
|
||||
{ // Handle paired UTF-16 surrogates.
|
||||
String surrogatePair = yytext();
|
||||
char highSurrogate = '\u0000';
|
||||
try { // High surrogates are in decimal range [55296, 56319]
|
||||
highSurrogate = (char)Integer.parseInt(surrogatePair.substring(1, 6));
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing high surrogate '"
|
||||
+ surrogatePair.substring(1, 6) + "'";
|
||||
}
|
||||
if (Character.isHighSurrogate(highSurrogate)) {
|
||||
outputSegment = entitySegment;
|
||||
outputSegment.clear();
|
||||
try {
|
||||
outputSegment.unsafeWrite
|
||||
((char)Integer.parseInt(surrogatePair.substring(10, 14), 16));
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing low surrogate '"
|
||||
+ surrogatePair.substring(10, 14) + "'";
|
||||
}
|
||||
// add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 2;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 2, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return highSurrogate;
|
||||
}
|
||||
yypushback(surrogatePair.length() - 1); // Consume only '#'
|
||||
inputSegment.append('#');
|
||||
yybegin(NUMERIC_CHARACTER);
|
||||
}
|
||||
case 70: break;
|
||||
case 28:
|
||||
{ restoreState = STYLE_COMMENT; yybegin(SINGLE_QUOTED_STRING);
|
||||
}
|
||||
case 71: break;
|
||||
case 50:
|
||||
{ // Handle paired UTF-16 surrogates.
|
||||
outputSegment = entitySegment;
|
||||
outputSegment.clear();
|
||||
String surrogatePair = yytext();
|
||||
char highSurrogate = '\u0000';
|
||||
try {
|
||||
highSurrogate = (char)Integer.parseInt(surrogatePair.substring(2, 6), 16);
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing high surrogate '"
|
||||
+ surrogatePair.substring(2, 6) + "'";
|
||||
}
|
||||
try {
|
||||
outputSegment.unsafeWrite
|
||||
((char)Integer.parseInt(surrogatePair.substring(10, 14), 16));
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing low surrogate '"
|
||||
+ surrogatePair.substring(10, 14) + "'";
|
||||
}
|
||||
// add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 2;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 2, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return highSurrogate;
|
||||
}
|
||||
case 72: break;
|
||||
case 16:
|
||||
{ restoreState = SCRIPT_COMMENT; yybegin(SINGLE_QUOTED_STRING);
|
||||
}
|
||||
case 73: break;
|
||||
case 22:
|
||||
{ previousRestoreState = restoreState;
|
||||
restoreState = SERVER_SIDE_INCLUDE;
|
||||
yybegin(SINGLE_QUOTED_STRING);
|
||||
yybegin(DOUBLE_QUOTED_STRING);
|
||||
}
|
||||
case 57: break;
|
||||
case 74: break;
|
||||
case 26:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += inputSegment.length() + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 75: break;
|
||||
case 20:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
}
|
||||
case 76: break;
|
||||
case 47:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += inputSegment.length() + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(CDATA);
|
||||
}
|
||||
case 77: break;
|
||||
case 33:
|
||||
{ yybegin(YYINITIAL);
|
||||
if (escapeBR) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
return outputSegment.nextChar();
|
||||
} else {
|
||||
// add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 1;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 1, cumulativeDiff);
|
||||
inputSegment.reset();
|
||||
return BR_START_TAG_REPLACEMENT;
|
||||
}
|
||||
}
|
||||
case 78: break;
|
||||
case 23:
|
||||
{ yybegin(restoreState); restoreState = previousRestoreState;
|
||||
}
|
||||
case 79: break;
|
||||
case 32:
|
||||
{ yybegin(COMMENT);
|
||||
}
|
||||
case 80: break;
|
||||
case 24:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
case 81: break;
|
||||
case 3:
|
||||
{ inputStart = yychar;
|
||||
inputSegment.clear();
|
||||
inputSegment.append('&');
|
||||
yybegin(AMPERSAND);
|
||||
}
|
||||
case 82: break;
|
||||
case 46:
|
||||
{ yybegin(SCRIPT);
|
||||
if (escapeSCRIPT) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
inputStart += 1 + yylength();
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 83: break;
|
||||
case 14:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += inputSegment.length() + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 84: break;
|
||||
case 6:
|
||||
{ int matchLength = yylength();
|
||||
inputSegment.write(zzBuffer, zzStartRead, matchLength);
|
||||
if (matchLength <= 7) { // 0x10FFFF = 1114111: max 7 decimal chars
|
||||
String decimalCharRef = yytext();
|
||||
int codePoint = 0;
|
||||
try {
|
||||
codePoint = Integer.parseInt(decimalCharRef);
|
||||
} catch(Exception e) {
|
||||
assert false: "Exception parsing code point '" + decimalCharRef + "'";
|
||||
}
|
||||
if (codePoint <= 0x10FFFF) {
|
||||
outputSegment = entitySegment;
|
||||
outputSegment.clear();
|
||||
if (codePoint >= Character.MIN_SURROGATE
|
||||
&& codePoint <= Character.MAX_SURROGATE) {
|
||||
outputSegment.unsafeWrite(REPLACEMENT_CHARACTER);
|
||||
} else {
|
||||
outputSegment.setLength
|
||||
(Character.toChars(codePoint, outputSegment.getArray(), 0));
|
||||
}
|
||||
yybegin(CHARACTER_REFERENCE_TAIL);
|
||||
} else {
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
} else {
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 85: break;
|
||||
case 34:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0]
|
||||
cumulativeDiff += yychar - inputStart + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 86: break;
|
||||
case 5:
|
||||
{ inputSegment.append('#'); yybegin(NUMERIC_CHARACTER);
|
||||
}
|
||||
case 87: break;
|
||||
case 13:
|
||||
{ inputSegment.append(zzBuffer[zzStartRead]);
|
||||
}
|
||||
case 88: break;
|
||||
case 18:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(END_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(END_TAG_TAIL_SUBSTITUTE);
|
||||
}
|
||||
}
|
||||
case 89: break;
|
||||
case 40:
|
||||
{ yybegin(SCRIPT_COMMENT);
|
||||
}
|
||||
case 90: break;
|
||||
case 37:
|
||||
{ // add (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 91: break;
|
||||
case 12:
|
||||
{ inputSegment.append('/'); yybegin(LEFT_ANGLE_BRACKET_SLASH);
|
||||
}
|
||||
case 92: break;
|
||||
case 9:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(START_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(START_TAG_TAIL_EXCLUDE);
|
||||
}
|
||||
}
|
||||
case 93: break;
|
||||
case 49:
|
||||
{ inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
// add (previously matched input length) -- current match and substitution handled below
|
||||
cumulativeDiff += yychar - inputStart;
|
||||
// position at (already output length) -- substitution handled below
|
||||
int offsetCorrectionPos = outputCharCount;
|
||||
int returnValue;
|
||||
if (escapeSCRIPT) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
returnValue = outputSegment.nextChar();
|
||||
} else {
|
||||
// add (this match length) - (substitution length)
|
||||
cumulativeDiff += yylength() - 1;
|
||||
// add (substitution length)
|
||||
++offsetCorrectionPos;
|
||||
returnValue = SCRIPT_REPLACEMENT;
|
||||
}
|
||||
addOffCorrectMap(offsetCorrectionPos, cumulativeDiff);
|
||||
return returnValue;
|
||||
}
|
||||
case 94: break;
|
||||
case 29:
|
||||
{ restoreState = STYLE_COMMENT; yybegin(DOUBLE_QUOTED_STRING);
|
||||
}
|
||||
case 95: break;
|
||||
case 17:
|
||||
{ restoreState = SCRIPT_COMMENT; yybegin(DOUBLE_QUOTED_STRING);
|
||||
}
|
||||
case 96: break;
|
||||
case 45:
|
||||
{ yybegin(STYLE);
|
||||
if (escapeSTYLE) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
inputStart += 1 + yylength();
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 97: break;
|
||||
case 7:
|
||||
{ // add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - outputSegment.length();
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + outputSegment.length(), cumulativeDiff);
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
case 98: break;
|
||||
case 19:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(END_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(END_TAG_TAIL_EXCLUDE);
|
||||
}
|
||||
}
|
||||
case 99: break;
|
||||
case 25:
|
||||
{ // add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 1;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 1, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return BLOCK_LEVEL_END_TAG_REPLACEMENT;
|
||||
}
|
||||
case 100: break;
|
||||
case 31:
|
||||
{ int matchLength = yylength();
|
||||
inputSegment.write(zzBuffer, zzStartRead, matchLength);
|
||||
|
@ -31329,66 +31734,7 @@ public final class HTMLStripCharFilter extends BaseCharFilter {
|
|||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 58: break;
|
||||
case 19:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(END_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(END_TAG_TAIL_EXCLUDE);
|
||||
}
|
||||
}
|
||||
case 59: break;
|
||||
case 2:
|
||||
{ inputStart = yychar;
|
||||
inputSegment.clear();
|
||||
inputSegment.append('<');
|
||||
yybegin(LEFT_ANGLE_BRACKET);
|
||||
}
|
||||
case 60: break;
|
||||
case 27:
|
||||
{ // add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 1;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 1, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return BLOCK_LEVEL_START_TAG_REPLACEMENT;
|
||||
}
|
||||
case 61: break;
|
||||
case 44:
|
||||
{ restoreState = STYLE_COMMENT; yybegin(SERVER_SIDE_INCLUDE);
|
||||
}
|
||||
case 62: break;
|
||||
case 35:
|
||||
{ yybegin(SCRIPT);
|
||||
}
|
||||
case 63: break;
|
||||
case 42:
|
||||
{ restoreState = COMMENT; yybegin(SERVER_SIDE_INCLUDE);
|
||||
}
|
||||
case 64: break;
|
||||
case 10:
|
||||
{ inputSegment.append('!'); yybegin(BANG);
|
||||
}
|
||||
case 65: break;
|
||||
case 33:
|
||||
{ yybegin(YYINITIAL);
|
||||
if (escapeBR) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
return outputSegment.nextChar();
|
||||
} else {
|
||||
// add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 1;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 1, cumulativeDiff);
|
||||
inputSegment.reset();
|
||||
return BR_START_TAG_REPLACEMENT;
|
||||
}
|
||||
}
|
||||
case 66: break;
|
||||
case 101: break;
|
||||
case 53:
|
||||
{ // Handle paired UTF-16 surrogates.
|
||||
String surrogatePair = yytext();
|
||||
|
@ -31424,288 +31770,7 @@ public final class HTMLStripCharFilter extends BaseCharFilter {
|
|||
inputSegment.append('#');
|
||||
yybegin(NUMERIC_CHARACTER);
|
||||
}
|
||||
case 67: break;
|
||||
case 43:
|
||||
{ restoreState = SCRIPT_COMMENT; yybegin(SERVER_SIDE_INCLUDE);
|
||||
}
|
||||
case 68: break;
|
||||
case 30:
|
||||
{ int length = yylength();
|
||||
inputSegment.write(zzBuffer, zzStartRead, length);
|
||||
entitySegment.clear();
|
||||
char ch = entityValues.get(zzBuffer, zzStartRead, length).charValue();
|
||||
entitySegment.append(ch);
|
||||
outputSegment = entitySegment;
|
||||
yybegin(CHARACTER_REFERENCE_TAIL);
|
||||
}
|
||||
case 69: break;
|
||||
case 28:
|
||||
{ restoreState = STYLE_COMMENT; yybegin(SINGLE_QUOTED_STRING);
|
||||
}
|
||||
case 70: break;
|
||||
case 3:
|
||||
{ inputStart = yychar;
|
||||
inputSegment.clear();
|
||||
inputSegment.append('&');
|
||||
yybegin(AMPERSAND);
|
||||
}
|
||||
case 71: break;
|
||||
case 16:
|
||||
{ restoreState = SCRIPT_COMMENT; yybegin(SINGLE_QUOTED_STRING);
|
||||
}
|
||||
case 72: break;
|
||||
case 52:
|
||||
{ // Handle paired UTF-16 surrogates.
|
||||
String surrogatePair = yytext();
|
||||
char highSurrogate = '\u0000';
|
||||
try { // High surrogates are in decimal range [55296, 56319]
|
||||
highSurrogate = (char)Integer.parseInt(surrogatePair.substring(1, 6));
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing high surrogate '"
|
||||
+ surrogatePair.substring(1, 6) + "'";
|
||||
}
|
||||
if (Character.isHighSurrogate(highSurrogate)) {
|
||||
outputSegment = entitySegment;
|
||||
outputSegment.clear();
|
||||
try {
|
||||
outputSegment.unsafeWrite
|
||||
((char)Integer.parseInt(surrogatePair.substring(10, 14), 16));
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing low surrogate '"
|
||||
+ surrogatePair.substring(10, 14) + "'";
|
||||
}
|
||||
// add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 2;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 2, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return highSurrogate;
|
||||
}
|
||||
yypushback(surrogatePair.length() - 1); // Consume only '#'
|
||||
inputSegment.append('#');
|
||||
yybegin(NUMERIC_CHARACTER);
|
||||
}
|
||||
case 73: break;
|
||||
case 6:
|
||||
{ int matchLength = yylength();
|
||||
inputSegment.write(zzBuffer, zzStartRead, matchLength);
|
||||
if (matchLength <= 7) { // 0x10FFFF = 1114111: max 7 decimal chars
|
||||
String decimalCharRef = yytext();
|
||||
int codePoint = 0;
|
||||
try {
|
||||
codePoint = Integer.parseInt(decimalCharRef);
|
||||
} catch(Exception e) {
|
||||
assert false: "Exception parsing code point '" + decimalCharRef + "'";
|
||||
}
|
||||
if (codePoint <= 0x10FFFF) {
|
||||
outputSegment = entitySegment;
|
||||
outputSegment.clear();
|
||||
if (codePoint >= Character.MIN_SURROGATE
|
||||
&& codePoint <= Character.MAX_SURROGATE) {
|
||||
outputSegment.unsafeWrite(REPLACEMENT_CHARACTER);
|
||||
} else {
|
||||
outputSegment.setLength
|
||||
(Character.toChars(codePoint, outputSegment.getArray(), 0));
|
||||
}
|
||||
yybegin(CHARACTER_REFERENCE_TAIL);
|
||||
} else {
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
} else {
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 74: break;
|
||||
case 37:
|
||||
{ // add (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 75: break;
|
||||
case 8:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(START_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(START_TAG_TAIL_SUBSTITUTE);
|
||||
}
|
||||
}
|
||||
case 76: break;
|
||||
case 46:
|
||||
{ yybegin(SCRIPT);
|
||||
if (escapeSCRIPT) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
inputStart += 1 + yylength();
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 77: break;
|
||||
case 11:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
yybegin(LEFT_ANGLE_BRACKET_SPACE);
|
||||
}
|
||||
case 78: break;
|
||||
case 20:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
}
|
||||
case 79: break;
|
||||
case 34:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0]
|
||||
cumulativeDiff += yychar - inputStart + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 80: break;
|
||||
case 23:
|
||||
{ yybegin(restoreState); restoreState = previousRestoreState;
|
||||
}
|
||||
case 81: break;
|
||||
case 32:
|
||||
{ yybegin(COMMENT);
|
||||
}
|
||||
case 82: break;
|
||||
case 14:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += inputSegment.length() + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 83: break;
|
||||
case 18:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(END_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(END_TAG_TAIL_SUBSTITUTE);
|
||||
}
|
||||
}
|
||||
case 84: break;
|
||||
case 25:
|
||||
{ // add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 1;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 1, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return BLOCK_LEVEL_END_TAG_REPLACEMENT;
|
||||
}
|
||||
case 85: break;
|
||||
case 7:
|
||||
{ // add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - outputSegment.length();
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + outputSegment.length(), cumulativeDiff);
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
case 86: break;
|
||||
case 48:
|
||||
{ inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
// add (previously matched input length) -- current match and substitution handled below
|
||||
cumulativeDiff += yychar - inputStart;
|
||||
// position the offset correction at (already output length) -- substitution handled below
|
||||
int offsetCorrectionPos = outputCharCount;
|
||||
int returnValue;
|
||||
if (escapeSTYLE) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
returnValue = outputSegment.nextChar();
|
||||
} else {
|
||||
// add (this match length) - (substitution length)
|
||||
cumulativeDiff += yylength() - 1;
|
||||
// add (substitution length)
|
||||
++offsetCorrectionPos;
|
||||
returnValue = STYLE_REPLACEMENT;
|
||||
}
|
||||
addOffCorrectMap(offsetCorrectionPos, cumulativeDiff);
|
||||
return returnValue;
|
||||
}
|
||||
case 87: break;
|
||||
case 5:
|
||||
{ inputSegment.append('#'); yybegin(NUMERIC_CHARACTER);
|
||||
}
|
||||
case 88: break;
|
||||
case 26:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += inputSegment.length() + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
}
|
||||
case 89: break;
|
||||
case 13:
|
||||
{ inputSegment.append(zzBuffer[zzStartRead]);
|
||||
}
|
||||
case 90: break;
|
||||
case 50:
|
||||
{ // Handle paired UTF-16 surrogates.
|
||||
outputSegment = entitySegment;
|
||||
outputSegment.clear();
|
||||
String surrogatePair = yytext();
|
||||
char highSurrogate = '\u0000';
|
||||
try {
|
||||
highSurrogate = (char)Integer.parseInt(surrogatePair.substring(2, 6), 16);
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing high surrogate '"
|
||||
+ surrogatePair.substring(2, 6) + "'";
|
||||
}
|
||||
try {
|
||||
outputSegment.unsafeWrite
|
||||
((char)Integer.parseInt(surrogatePair.substring(10, 14), 16));
|
||||
} catch(Exception e) { // should never happen
|
||||
assert false: "Exception parsing low surrogate '"
|
||||
+ surrogatePair.substring(10, 14) + "'";
|
||||
}
|
||||
// add (previously matched input length) + (this match length) - (substitution length)
|
||||
cumulativeDiff += inputSegment.length() + yylength() - 2;
|
||||
// position the correction at (already output length) + (substitution length)
|
||||
addOffCorrectMap(outputCharCount + 2, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
return highSurrogate;
|
||||
}
|
||||
case 91: break;
|
||||
case 40:
|
||||
{ yybegin(SCRIPT_COMMENT);
|
||||
}
|
||||
case 92: break;
|
||||
case 45:
|
||||
{ yybegin(STYLE);
|
||||
if (escapeSTYLE) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
inputStart += 1 + yylength();
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
}
|
||||
case 93: break;
|
||||
case 22:
|
||||
{ previousRestoreState = restoreState;
|
||||
restoreState = SERVER_SIDE_INCLUDE;
|
||||
yybegin(DOUBLE_QUOTED_STRING);
|
||||
}
|
||||
case 94: break;
|
||||
case 12:
|
||||
{ inputSegment.append('/'); yybegin(LEFT_ANGLE_BRACKET_SLASH);
|
||||
}
|
||||
case 95: break;
|
||||
case 102: break;
|
||||
case 36:
|
||||
{ yybegin(YYINITIAL);
|
||||
if (escapeBR) {
|
||||
|
@ -31721,83 +31786,18 @@ public final class HTMLStripCharFilter extends BaseCharFilter {
|
|||
return BR_END_TAG_REPLACEMENT;
|
||||
}
|
||||
}
|
||||
case 96: break;
|
||||
case 24:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
case 97: break;
|
||||
case 47:
|
||||
{ // add (previously matched input length) + (this match length) [ - (substitution length) = 0 ]
|
||||
cumulativeDiff += inputSegment.length() + yylength();
|
||||
// position the correction at (already output length) [ + (substitution length) = 0 ]
|
||||
addOffCorrectMap(outputCharCount, cumulativeDiff);
|
||||
inputSegment.clear();
|
||||
yybegin(CDATA);
|
||||
}
|
||||
case 98: break;
|
||||
case 29:
|
||||
{ restoreState = STYLE_COMMENT; yybegin(DOUBLE_QUOTED_STRING);
|
||||
}
|
||||
case 99: break;
|
||||
case 17:
|
||||
{ restoreState = SCRIPT_COMMENT; yybegin(DOUBLE_QUOTED_STRING);
|
||||
}
|
||||
case 100: break;
|
||||
case 9:
|
||||
{ inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
if (null != escapedTags
|
||||
&& escapedTags.contains(zzBuffer, zzStartRead, yylength())) {
|
||||
yybegin(START_TAG_TAIL_INCLUDE);
|
||||
} else {
|
||||
yybegin(START_TAG_TAIL_EXCLUDE);
|
||||
}
|
||||
}
|
||||
case 101: break;
|
||||
case 49:
|
||||
{ inputSegment.clear();
|
||||
yybegin(YYINITIAL);
|
||||
// add (previously matched input length) -- current match and substitution handled below
|
||||
cumulativeDiff += yychar - inputStart;
|
||||
// position at (already output length) -- substitution handled below
|
||||
int offsetCorrectionPos = outputCharCount;
|
||||
int returnValue;
|
||||
if (escapeSCRIPT) {
|
||||
inputSegment.write(zzBuffer, zzStartRead, yylength());
|
||||
outputSegment = inputSegment;
|
||||
returnValue = outputSegment.nextChar();
|
||||
} else {
|
||||
// add (this match length) - (substitution length)
|
||||
cumulativeDiff += yylength() - 1;
|
||||
// add (substitution length)
|
||||
++offsetCorrectionPos;
|
||||
returnValue = SCRIPT_REPLACEMENT;
|
||||
}
|
||||
addOffCorrectMap(offsetCorrectionPos, cumulativeDiff);
|
||||
return returnValue;
|
||||
}
|
||||
case 102: break;
|
||||
case 103: break;
|
||||
case 38:
|
||||
{ yybegin(restoreState);
|
||||
}
|
||||
case 103: break;
|
||||
case 104: break;
|
||||
case 41:
|
||||
{ yybegin(STYLE_COMMENT);
|
||||
}
|
||||
case 104: break;
|
||||
case 105: break;
|
||||
case 1:
|
||||
{ return zzBuffer[zzStartRead];
|
||||
}
|
||||
case 105: break;
|
||||
case 4:
|
||||
{ yypushback(1);
|
||||
outputSegment = inputSegment;
|
||||
outputSegment.restart();
|
||||
yybegin(YYINITIAL);
|
||||
return outputSegment.nextChar();
|
||||
}
|
||||
case 106: break;
|
||||
default:
|
||||
if (zzInput == YYEOF && zzStartRead == zzCurrentPos) {
|
||||
|
|
|
@ -141,9 +141,9 @@ InlineElment = ( [aAbBiIqQsSuU] |
|
|||
[vV][aA][rR] )
|
||||
|
||||
|
||||
%include src/java/org/apache/lucene/analysis/charfilter/HTMLCharacterEntities.jflex
|
||||
%include HTMLCharacterEntities.jflex
|
||||
|
||||
%include src/java/org/apache/lucene/analysis/charfilter/HTMLStripCharFilter.SUPPLEMENTARY.jflex-macro
|
||||
%include HTMLStripCharFilter.SUPPLEMENTARY.jflex-macro
|
||||
|
||||
%{
|
||||
private static final int INITIAL_INPUT_SEGMENT_SIZE = 1024;
|
||||
|
|
|
@ -24,6 +24,8 @@ import org.apache.lucene.analysis.TokenStream;
|
|||
import org.apache.lucene.analysis.standard.StandardTokenizer;
|
||||
import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
||||
import org.apache.lucene.analysis.tokenattributes.OffsetAttribute;
|
||||
import org.apache.lucene.analysis.tokenattributes.PositionIncrementAttribute;
|
||||
import org.apache.lucene.analysis.tokenattributes.PositionLengthAttribute;
|
||||
import org.apache.lucene.analysis.tokenattributes.TypeAttribute;
|
||||
import org.apache.lucene.util.ArrayUtil;
|
||||
|
||||
|
@ -35,6 +37,12 @@ import org.apache.lucene.util.ArrayUtil;
|
|||
* {@link #CJKBigramFilter(TokenStream, int)} to explicitly control which
|
||||
* of the CJK scripts are turned into bigrams.
|
||||
* <p>
|
||||
* By default, when a CJK character has no adjacent characters to form
|
||||
* a bigram, it is output in unigram form. If you want to always output
|
||||
* both unigrams and bigrams, set the <code>outputUnigrams</code>
|
||||
* flag in {@link CJKBigramFilter#CJKBigramFilter(TokenStream, int, boolean)}.
|
||||
* This can be used for a combined unigram+bigram approach.
|
||||
* <p>
|
||||
* In all cases, all non-CJK input is passed through unmodified.
|
||||
*/
|
||||
public final class CJKBigramFilter extends TokenFilter {
|
||||
|
@ -68,9 +76,15 @@ public final class CJKBigramFilter extends TokenFilter {
|
|||
private final Object doKatakana;
|
||||
private final Object doHangul;
|
||||
|
||||
// true if we should output unigram tokens always
|
||||
private final boolean outputUnigrams;
|
||||
private boolean ngramState; // false = output unigram, true = output bigram
|
||||
|
||||
private final CharTermAttribute termAtt = addAttribute(CharTermAttribute.class);
|
||||
private final TypeAttribute typeAtt = addAttribute(TypeAttribute.class);
|
||||
private final OffsetAttribute offsetAtt = addAttribute(OffsetAttribute.class);
|
||||
private final PositionIncrementAttribute posIncAtt = addAttribute(PositionIncrementAttribute.class);
|
||||
private final PositionLengthAttribute posLengthAtt = addAttribute(PositionLengthAttribute.class);
|
||||
|
||||
// buffers containing codepoint and offsets in parallel
|
||||
int buffer[] = new int[8];
|
||||
|
@ -88,23 +102,36 @@ public final class CJKBigramFilter extends TokenFilter {
|
|||
|
||||
/**
|
||||
* Calls {@link CJKBigramFilter#CJKBigramFilter(TokenStream, int)
|
||||
* CJKBigramFilter(HAN | HIRAGANA | KATAKANA | HANGUL)}
|
||||
* CJKBigramFilter(in, HAN | HIRAGANA | KATAKANA | HANGUL)}
|
||||
*/
|
||||
public CJKBigramFilter(TokenStream in) {
|
||||
this(in, HAN | HIRAGANA | KATAKANA | HANGUL);
|
||||
}
|
||||
|
||||
/**
|
||||
* Create a new CJKBigramFilter, specifying which writing systems should be bigrammed.
|
||||
* @param flags OR'ed set from {@link CJKBigramFilter#HAN}, {@link CJKBigramFilter#HIRAGANA},
|
||||
* {@link CJKBigramFilter#KATAKANA}, {@link CJKBigramFilter#HANGUL}
|
||||
* Calls {@link CJKBigramFilter#CJKBigramFilter(TokenStream, int, boolean)
|
||||
* CJKBigramFilter(in, flags, false)}
|
||||
*/
|
||||
public CJKBigramFilter(TokenStream in, int flags) {
|
||||
this(in, flags, false);
|
||||
}
|
||||
|
||||
/**
|
||||
* Create a new CJKBigramFilter, specifying which writing systems should be bigrammed,
|
||||
* and whether or not unigrams should also be output.
|
||||
* @param flags OR'ed set from {@link CJKBigramFilter#HAN}, {@link CJKBigramFilter#HIRAGANA},
|
||||
* {@link CJKBigramFilter#KATAKANA}, {@link CJKBigramFilter#HANGUL}
|
||||
* @param outputUnigrams true if unigrams for the selected writing systems should also be output.
|
||||
* When this is false, a unigram is output only when there are no adjacent characters to form
|
||||
* a bigram.
|
||||
*/
|
||||
public CJKBigramFilter(TokenStream in, int flags, boolean outputUnigrams) {
|
||||
super(in);
|
||||
doHan = (flags & HAN) == 0 ? NO : HAN_TYPE;
|
||||
doHiragana = (flags & HIRAGANA) == 0 ? NO : HIRAGANA_TYPE;
|
||||
doKatakana = (flags & KATAKANA) == 0 ? NO : KATAKANA_TYPE;
|
||||
doHangul = (flags & HANGUL) == 0 ? NO : HANGUL_TYPE;
|
||||
this.outputUnigrams = outputUnigrams;
|
||||
}
|
||||
|
||||
/*
|
||||
|
@ -120,7 +147,24 @@ public final class CJKBigramFilter extends TokenFilter {
|
|||
// case 1: we have multiple remaining codepoints buffered,
|
||||
// so we can emit a bigram here.
|
||||
|
||||
if (outputUnigrams) {
|
||||
|
||||
// when also outputting unigrams, we output the unigram first,
|
||||
// then rewind back to revisit the bigram.
|
||||
// so an input of ABC is A + (rewind)AB + B + (rewind)BC + C
|
||||
// the logic in hasBufferedUnigram ensures we output the C,
|
||||
// even though it did actually have adjacent CJK characters.
|
||||
|
||||
if (ngramState) {
|
||||
flushBigram();
|
||||
} else {
|
||||
flushUnigram();
|
||||
index--;
|
||||
}
|
||||
ngramState = !ngramState;
|
||||
} else {
|
||||
flushBigram();
|
||||
}
|
||||
return true;
|
||||
} else if (doNext()) {
|
||||
|
||||
|
@ -260,6 +304,11 @@ public final class CJKBigramFilter extends TokenFilter {
|
|||
termAtt.setLength(len2);
|
||||
offsetAtt.setOffset(startOffset[index], endOffset[index+1]);
|
||||
typeAtt.setType(DOUBLE_TYPE);
|
||||
// when outputting unigrams, all bigrams are synonyms that span two unigrams
|
||||
if (outputUnigrams) {
|
||||
posIncAtt.setPositionIncrement(0);
|
||||
posLengthAtt.setPositionLength(2);
|
||||
}
|
||||
index++;
|
||||
}
|
||||
|
||||
|
@ -292,8 +341,14 @@ public final class CJKBigramFilter extends TokenFilter {
|
|||
* inputs.
|
||||
*/
|
||||
private boolean hasBufferedUnigram() {
|
||||
if (outputUnigrams) {
|
||||
// when outputting unigrams always
|
||||
return bufferLen - index == 1;
|
||||
} else {
|
||||
// otherwise it's only when we have a lone CJK character
|
||||
return bufferLen == 1 && index == 0;
|
||||
}
|
||||
}
|
||||
|
||||
@Override
|
||||
public void reset() throws IOException {
|
||||
|
@ -303,5 +358,6 @@ public final class CJKBigramFilter extends TokenFilter {
|
|||
lastEndOffset = 0;
|
||||
loneState = null;
|
||||
exhausted = false;
|
||||
ngramState = false;
|
||||
}
|
||||
}
|
||||
|
|
|
@ -33,12 +33,13 @@ import org.apache.lucene.analysis.util.TokenFilterFactory;
|
|||
* <filter class="solr.LowerCaseFilterFactory"/>
|
||||
* <filter class="solr.CJKBigramFilterFactory"
|
||||
* han="true" hiragana="true"
|
||||
* katakana="true" hangul="true" />
|
||||
* katakana="true" hangul="true" outputUnigrams="false" />
|
||||
* </analyzer>
|
||||
* </fieldType></pre>
|
||||
*/
|
||||
public class CJKBigramFilterFactory extends TokenFilterFactory {
|
||||
int flags;
|
||||
boolean outputUnigrams;
|
||||
|
||||
@Override
|
||||
public void init(Map<String,String> args) {
|
||||
|
@ -56,10 +57,11 @@ public class CJKBigramFilterFactory extends TokenFilterFactory {
|
|||
if (getBoolean("hangul", true)) {
|
||||
flags |= CJKBigramFilter.HANGUL;
|
||||
}
|
||||
outputUnigrams = getBoolean("outputUnigrams", false);
|
||||
}
|
||||
|
||||
@Override
|
||||
public TokenStream create(TokenStream input) {
|
||||
return new CJKBigramFilter(input, flags);
|
||||
return new CJKBigramFilter(input, flags, outputUnigrams);
|
||||
}
|
||||
}
|
||||
|
|
|
@ -28,6 +28,7 @@ import org.apache.lucene.analysis.standard.StandardFilter;
|
|||
import org.apache.lucene.analysis.standard.StandardTokenizer;
|
||||
import org.apache.lucene.analysis.standard.StandardAnalyzer; // for javadoc
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ElisionFilter;
|
||||
import org.apache.lucene.analysis.util.StopwordAnalyzerBase;
|
||||
import org.apache.lucene.analysis.util.WordlistLoader;
|
||||
import org.apache.lucene.util.IOUtils;
|
||||
|
@ -35,6 +36,7 @@ import org.apache.lucene.util.Version;
|
|||
|
||||
import java.io.IOException;
|
||||
import java.io.Reader;
|
||||
import java.util.Arrays;
|
||||
|
||||
/**
|
||||
* {@link Analyzer} for French language.
|
||||
|
@ -54,6 +56,11 @@ public final class FrenchAnalyzer extends StopwordAnalyzerBase {
|
|||
/** File containing default French stopwords. */
|
||||
public final static String DEFAULT_STOPWORD_FILE = "french_stop.txt";
|
||||
|
||||
/** Default set of articles for ElisionFilter */
|
||||
public static final CharArraySet DEFAULT_ARTICLES = CharArraySet.unmodifiableSet(
|
||||
new CharArraySet(Version.LUCENE_CURRENT, Arrays.asList(
|
||||
"l", "m", "t", "qu", "n", "s", "j"), true));
|
||||
|
||||
/**
|
||||
* Contains words that should be indexed but not stemmed.
|
||||
*/
|
||||
|
@ -134,7 +141,7 @@ public final class FrenchAnalyzer extends StopwordAnalyzerBase {
|
|||
Reader reader) {
|
||||
final Tokenizer source = new StandardTokenizer(matchVersion, reader);
|
||||
TokenStream result = new StandardFilter(matchVersion, source);
|
||||
result = new ElisionFilter(matchVersion, result);
|
||||
result = new ElisionFilter(result, DEFAULT_ARTICLES);
|
||||
result = new LowerCaseFilter(matchVersion, result);
|
||||
result = new StopFilter(matchVersion, result, stopwords);
|
||||
if(!excltable.isEmpty())
|
||||
|
|
|
@ -23,7 +23,6 @@ import java.util.Arrays;
|
|||
|
||||
import org.apache.lucene.analysis.Analyzer;
|
||||
import org.apache.lucene.analysis.core.StopFilter;
|
||||
import org.apache.lucene.analysis.fr.ElisionFilter;
|
||||
import org.apache.lucene.analysis.miscellaneous.KeywordMarkerFilter;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.Tokenizer;
|
||||
|
@ -31,6 +30,7 @@ import org.apache.lucene.analysis.snowball.SnowballFilter;
|
|||
import org.apache.lucene.analysis.standard.StandardFilter;
|
||||
import org.apache.lucene.analysis.standard.StandardTokenizer;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ElisionFilter;
|
||||
import org.apache.lucene.analysis.util.StopwordAnalyzerBase;
|
||||
import org.apache.lucene.util.Version;
|
||||
import org.tartarus.snowball.ext.IrishStemmer;
|
||||
|
@ -140,7 +140,7 @@ public final class IrishAnalyzer extends StopwordAnalyzerBase {
|
|||
StopFilter s = new StopFilter(matchVersion, result, HYPHENATIONS);
|
||||
s.setEnablePositionIncrements(false);
|
||||
result = s;
|
||||
result = new ElisionFilter(matchVersion, result, DEFAULT_ARTICLES);
|
||||
result = new ElisionFilter(result, DEFAULT_ARTICLES);
|
||||
result = new IrishLowerCaseFilter(result);
|
||||
result = new StopFilter(matchVersion, result, stopwords);
|
||||
if(!stemExclusionSet.isEmpty())
|
||||
|
|
|
@ -24,7 +24,6 @@ import java.util.Arrays;
|
|||
import org.apache.lucene.analysis.Analyzer;
|
||||
import org.apache.lucene.analysis.core.LowerCaseFilter;
|
||||
import org.apache.lucene.analysis.core.StopFilter;
|
||||
import org.apache.lucene.analysis.fr.ElisionFilter;
|
||||
import org.apache.lucene.analysis.miscellaneous.KeywordMarkerFilter;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.Tokenizer;
|
||||
|
@ -32,6 +31,7 @@ import org.apache.lucene.analysis.snowball.SnowballFilter;
|
|||
import org.apache.lucene.analysis.standard.StandardFilter;
|
||||
import org.apache.lucene.analysis.standard.StandardTokenizer;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ElisionFilter;
|
||||
import org.apache.lucene.analysis.util.StopwordAnalyzerBase;
|
||||
import org.apache.lucene.analysis.util.WordlistLoader;
|
||||
import org.apache.lucene.util.IOUtils;
|
||||
|
@ -129,7 +129,7 @@ public final class ItalianAnalyzer extends StopwordAnalyzerBase {
|
|||
Reader reader) {
|
||||
final Tokenizer source = new StandardTokenizer(matchVersion, reader);
|
||||
TokenStream result = new StandardFilter(matchVersion, source);
|
||||
result = new ElisionFilter(matchVersion, result, DEFAULT_ARTICLES);
|
||||
result = new ElisionFilter(result, DEFAULT_ARTICLES);
|
||||
result = new LowerCaseFilter(matchVersion, result);
|
||||
result = new StopFilter(matchVersion, result, stopwords);
|
||||
if(!stemExclusionSet.isEmpty())
|
||||
|
|
|
@ -27,13 +27,47 @@ import org.apache.lucene.analysis.util.TokenizerFactory;
|
|||
|
||||
/**
|
||||
* Factory for {@link PathHierarchyTokenizer}.
|
||||
* <pre class="prettyprint" >
|
||||
* <fieldType name="text_path" class="solr.TextField" positionIncrementGap="100">
|
||||
* <analyzer>
|
||||
* <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="\" replace="/"/>
|
||||
* </analyzer>
|
||||
* </fieldType></pre>
|
||||
* <p>
|
||||
* This factory is typically configured for use only in the <code>index</code>
|
||||
* Analyzer (or only in the <code>query</code> Analyzer, but never both).
|
||||
* </p>
|
||||
* <p>
|
||||
* For example, in the configuration below a query for
|
||||
* <code>Books/NonFic</code> will match documents indexed with values like
|
||||
* <code>Books/NonFic</code>, <code>Books/NonFic/Law</code>,
|
||||
* <code>Books/NonFic/Science/Physics</code>, etc. But it will not match
|
||||
* documents indexed with values like <code>Books</code>, or
|
||||
* <code>Books/Fic</code>...
|
||||
* </p>
|
||||
*
|
||||
* <pre class="prettyprint" >
|
||||
* <fieldType name="descendent_path" class="solr.TextField">
|
||||
* <analyzer type="index">
|
||||
* <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
|
||||
* </analyzer>
|
||||
* <analyzer type="query">
|
||||
* <tokenizer class="solr.KeywordTokenizerFactory" />
|
||||
* </analyzer>
|
||||
* </fieldType>
|
||||
* </pre>
|
||||
* <p>
|
||||
* In this example, however, we see the opposite configuration, so that a query
|
||||
* for <code>Books/NonFic/Science/Physics</code> would match documents
|
||||
* containing <code>Books/NonFic</code>, <code>Books/NonFic/Science</code>,
|
||||
* or <code>Books/NonFic/Science/Physics</code>, but not
|
||||
* <code>Books/NonFic/Science/Physics/Theory</code> or
|
||||
* <code>Books/NonFic/Law</code>.
|
||||
* </p>
|
||||
* <pre class="prettyprint" >
|
||||
* <fieldType name="descendent_path" class="solr.TextField">
|
||||
* <analyzer type="index">
|
||||
* <tokenizer class="solr.KeywordTokenizerFactory" />
|
||||
* </analyzer>
|
||||
* <analyzer type="query">
|
||||
* <tokenizer class="solr.PathHierarchyTokenizerFactory" delimiter="/" />
|
||||
* </analyzer>
|
||||
* </fieldType>
|
||||
* </pre>
|
||||
*/
|
||||
public class PathHierarchyTokenizerFactory extends TokenizerFactory {
|
||||
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 7/15/12 1:57 AM */
|
||||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 8/6/12 11:57 AM */
|
||||
|
||||
package org.apache.lucene.analysis.standard;
|
||||
|
||||
|
@ -33,8 +33,8 @@ import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
|||
/**
|
||||
* This class is a scanner generated by
|
||||
* <a href="http://www.jflex.de/">JFlex</a> 1.5.0-SNAPSHOT
|
||||
* on 7/15/12 1:57 AM from the specification file
|
||||
* <tt>C:/cygwin/home/s/svn/lucene/dev/trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/standard/ClassicTokenizerImpl.jflex</tt>
|
||||
* on 8/6/12 11:57 AM from the specification file
|
||||
* <tt>/home/rmuir/workspace/lucene-trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/standard/ClassicTokenizerImpl.jflex</tt>
|
||||
*/
|
||||
class ClassicTokenizerImpl implements StandardTokenizerInterface {
|
||||
|
||||
|
@ -42,7 +42,7 @@ class ClassicTokenizerImpl implements StandardTokenizerInterface {
|
|||
public static final int YYEOF = -1;
|
||||
|
||||
/** initial size of the lookahead buffer */
|
||||
private static final int ZZ_BUFFERSIZE = 16384;
|
||||
private static final int ZZ_BUFFERSIZE = 4096;
|
||||
|
||||
/** lexical states */
|
||||
public static final int YYINITIAL = 0;
|
||||
|
|
|
@ -36,6 +36,7 @@ import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
|||
%function getNextToken
|
||||
%pack
|
||||
%char
|
||||
%buffer 4096
|
||||
|
||||
%{
|
||||
|
||||
|
|
|
@ -14,7 +14,7 @@
|
|||
* limitations under the License.
|
||||
*/
|
||||
|
||||
// Generated using ICU4J 49.1.0.0 on Thursday, July 26, 2012 10:22:01 PM UTC
|
||||
// Generated using ICU4J 49.1.0.0 on Monday, August 6, 2012 3:57:23 PM UTC
|
||||
// by org.apache.lucene.analysis.icu.GenerateJFlexSupplementaryMacros
|
||||
|
||||
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 7/26/12 6:22 PM */
|
||||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 8/6/12 11:57 AM */
|
||||
|
||||
package org.apache.lucene.analysis.standard;
|
||||
|
||||
|
@ -43,7 +43,7 @@ public final class StandardTokenizerImpl implements StandardTokenizerInterface {
|
|||
public static final int YYEOF = -1;
|
||||
|
||||
/** initial size of the lookahead buffer */
|
||||
private static final int ZZ_BUFFERSIZE = 16384;
|
||||
private static final int ZZ_BUFFERSIZE = 4096;
|
||||
|
||||
/** lexical states */
|
||||
public static final int YYINITIAL = 0;
|
||||
|
|
|
@ -44,8 +44,9 @@ import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
|||
%implements StandardTokenizerInterface
|
||||
%function getNextToken
|
||||
%char
|
||||
%buffer 4096
|
||||
|
||||
%include src/java/org/apache/lucene/analysis/standard/SUPPLEMENTARY.jflex-macro
|
||||
%include SUPPLEMENTARY.jflex-macro
|
||||
ALetter = ([\p{WB:ALetter}] | {ALetterSupp})
|
||||
Format = ([\p{WB:Format}] | {FormatSupp})
|
||||
Numeric = ([\p{WB:Numeric}] | {NumericSupp})
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 7/26/12 6:22 PM */
|
||||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 8/6/12 11:57 AM */
|
||||
|
||||
package org.apache.lucene.analysis.standard;
|
||||
|
||||
|
@ -46,7 +46,7 @@ public final class UAX29URLEmailTokenizerImpl implements StandardTokenizerInterf
|
|||
public static final int YYEOF = -1;
|
||||
|
||||
/** initial size of the lookahead buffer */
|
||||
private static final int ZZ_BUFFERSIZE = 16384;
|
||||
private static final int ZZ_BUFFERSIZE = 4096;
|
||||
|
||||
/** lexical states */
|
||||
public static final int YYINITIAL = 0;
|
||||
|
|
|
@ -47,8 +47,9 @@ import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
|||
%implements StandardTokenizerInterface
|
||||
%function getNextToken
|
||||
%char
|
||||
%buffer 4096
|
||||
|
||||
%include src/java/org/apache/lucene/analysis/standard/SUPPLEMENTARY.jflex-macro
|
||||
%include SUPPLEMENTARY.jflex-macro
|
||||
ALetter = ([\p{WB:ALetter}] | {ALetterSupp})
|
||||
Format = ([\p{WB:Format}] | {FormatSupp})
|
||||
Numeric = ([\p{WB:Numeric}] | {NumericSupp})
|
||||
|
@ -88,7 +89,7 @@ HiraganaEx = {Hiragana} ({Format} | {Extend})*
|
|||
// RFC-5321: Simple Mail Transfer Protocol
|
||||
// RFC-5322: Internet Message Format
|
||||
|
||||
%include src/java/org/apache/lucene/analysis/standard/ASCIITLD.jflex-macro
|
||||
%include ASCIITLD.jflex-macro
|
||||
|
||||
DomainLabel = [A-Za-z0-9] ([-A-Za-z0-9]* [A-Za-z0-9])?
|
||||
DomainNameStrict = {DomainLabel} ("." {DomainLabel})* {ASCIITLD}
|
||||
|
|
|
@ -0,0 +1,80 @@
|
|||
package org.apache.lucene.analysis.util;
|
||||
|
||||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
* contributor license agreements. See the NOTICE file distributed with
|
||||
* this work for additional information regarding copyright ownership.
|
||||
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||
* (the "License"); you may not use this file except in compliance with
|
||||
* the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
import java.io.IOException;
|
||||
import java.io.InputStream;
|
||||
|
||||
/**
|
||||
* Simple {@link ResourceLoader} that uses {@link ClassLoader#getResourceAsStream(String)}
|
||||
* and {@link Class#forName(String,boolean,ClassLoader)} to open resources and
|
||||
* classes, respectively.
|
||||
*/
|
||||
public final class ClasspathResourceLoader implements ResourceLoader {
|
||||
private final Class<?> clazz;
|
||||
private final ClassLoader loader;
|
||||
|
||||
/**
|
||||
* Creates an instance using the context classloader to load Resources and classes.
|
||||
* Resource paths must be absolute.
|
||||
*/
|
||||
public ClasspathResourceLoader() {
|
||||
this(Thread.currentThread().getContextClassLoader());
|
||||
}
|
||||
|
||||
/**
|
||||
* Creates an instance using the given classloader to load Resources and classes.
|
||||
* Resource paths must be absolute.
|
||||
*/
|
||||
public ClasspathResourceLoader(ClassLoader loader) {
|
||||
this(null, loader);
|
||||
}
|
||||
|
||||
/**
|
||||
* Creates an instance using the classloader of the given class to load Resources and classes.
|
||||
* Resources are resolved relative to the given class, if path is not absolute.
|
||||
*/
|
||||
public ClasspathResourceLoader(Class<?> clazz) {
|
||||
this(clazz, clazz.getClassLoader());
|
||||
}
|
||||
|
||||
private ClasspathResourceLoader(Class<?> clazz, ClassLoader loader) {
|
||||
this.clazz = clazz;
|
||||
this.loader = loader;
|
||||
}
|
||||
|
||||
@Override
|
||||
public InputStream openResource(String resource) throws IOException {
|
||||
final InputStream stream = (clazz != null) ?
|
||||
clazz.getResourceAsStream(resource) :
|
||||
loader.getResourceAsStream(resource);
|
||||
if (stream == null)
|
||||
throw new IOException("Resource not found: " + resource);
|
||||
return stream;
|
||||
}
|
||||
|
||||
@Override
|
||||
public <T> T newInstance(String cname, Class<T> expectedType) {
|
||||
try {
|
||||
final Class<? extends T> clazz = Class.forName(cname, true, loader).asSubclass(expectedType);
|
||||
return clazz.newInstance();
|
||||
} catch (Exception e) {
|
||||
throw new RuntimeException("Cannot instantiate class: " + cname, e);
|
||||
}
|
||||
}
|
||||
}
|
|
@ -1,4 +1,4 @@
|
|||
package org.apache.lucene.analysis.fr;
|
||||
package org.apache.lucene.analysis.util;
|
||||
|
||||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
|
@ -18,13 +18,11 @@ package org.apache.lucene.analysis.fr;
|
|||
*/
|
||||
|
||||
import java.io.IOException;
|
||||
import java.util.Arrays;
|
||||
|
||||
import org.apache.lucene.analysis.TokenFilter;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.util.Version;
|
||||
|
||||
/**
|
||||
* Removes elisions from a {@link TokenStream}. For example, "l'avion" (the plane) will be
|
||||
|
@ -33,31 +31,17 @@ import org.apache.lucene.util.Version;
|
|||
* @see <a href="http://fr.wikipedia.org/wiki/%C3%89lision">Elision in Wikipedia</a>
|
||||
*/
|
||||
public final class ElisionFilter extends TokenFilter {
|
||||
private CharArraySet articles = CharArraySet.EMPTY_SET;
|
||||
private final CharArraySet articles;
|
||||
private final CharTermAttribute termAtt = addAttribute(CharTermAttribute.class);
|
||||
private static final CharArraySet DEFAULT_ARTICLES = CharArraySet.unmodifiableSet(
|
||||
new CharArraySet(Version.LUCENE_CURRENT, Arrays.asList(
|
||||
"l", "m", "t", "qu", "n", "s", "j"), true));
|
||||
|
||||
private static char[] apostrophes = {'\'', '\u2019'};
|
||||
|
||||
/**
|
||||
* Constructs an elision filter with standard stop words
|
||||
*/
|
||||
public ElisionFilter(Version matchVersion, TokenStream input) {
|
||||
this(matchVersion, input, DEFAULT_ARTICLES);
|
||||
}
|
||||
|
||||
/**
|
||||
* Constructs an elision filter with a Set of stop words
|
||||
* @param matchVersion the lucene backwards compatibility version
|
||||
* @param input the source {@link TokenStream}
|
||||
* @param articles a set of stopword articles
|
||||
*/
|
||||
public ElisionFilter(Version matchVersion, TokenStream input, CharArraySet articles) {
|
||||
public ElisionFilter(TokenStream input, CharArraySet articles) {
|
||||
super(input);
|
||||
this.articles = CharArraySet.unmodifiableSet(
|
||||
new CharArraySet(matchVersion, articles, true));
|
||||
this.articles = articles;
|
||||
}
|
||||
|
||||
/**
|
||||
|
@ -69,22 +53,18 @@ public final class ElisionFilter extends TokenFilter {
|
|||
char[] termBuffer = termAtt.buffer();
|
||||
int termLength = termAtt.length();
|
||||
|
||||
int minPoz = Integer.MAX_VALUE;
|
||||
for (int i = 0; i < apostrophes.length; i++) {
|
||||
char apos = apostrophes[i];
|
||||
// The equivalent of String.indexOf(ch)
|
||||
for (int poz = 0; poz < termLength ; poz++) {
|
||||
if (termBuffer[poz] == apos) {
|
||||
minPoz = Math.min(poz, minPoz);
|
||||
int index = -1;
|
||||
for (int i = 0; i < termLength; i++) {
|
||||
char ch = termBuffer[i];
|
||||
if (ch == '\'' || ch == '\u2019') {
|
||||
index = i;
|
||||
break;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// An apostrophe has been found. If the prefix is an article strip it off.
|
||||
if (minPoz != Integer.MAX_VALUE
|
||||
&& articles.contains(termAtt.buffer(), 0, minPoz)) {
|
||||
termAtt.copyBuffer(termAtt.buffer(), minPoz + 1, termAtt.length() - (minPoz + 1));
|
||||
if (index >= 0 && articles.contains(termBuffer, 0, index)) {
|
||||
termAtt.copyBuffer(termBuffer, index + 1, termLength - (index + 1));
|
||||
}
|
||||
|
||||
return true;
|
|
@ -1,4 +1,4 @@
|
|||
package org.apache.lucene.analysis.fr;
|
||||
package org.apache.lucene.analysis.util;
|
||||
|
||||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
|
@ -17,10 +17,9 @@ package org.apache.lucene.analysis.fr;
|
|||
* limitations under the License.
|
||||
*/
|
||||
|
||||
import org.apache.lucene.analysis.util.*;
|
||||
|
||||
import java.io.IOException;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.fr.FrenchAnalyzer;
|
||||
|
||||
/**
|
||||
* Factory for {@link ElisionFilter}.
|
||||
|
@ -46,12 +45,13 @@ public class ElisionFilterFactory extends TokenFilterFactory implements Resource
|
|||
if (articlesFile != null) {
|
||||
articles = getWordSet(loader, articlesFile, ignoreCase);
|
||||
}
|
||||
if (articles == null) {
|
||||
articles = FrenchAnalyzer.DEFAULT_ARTICLES;
|
||||
}
|
||||
}
|
||||
|
||||
public ElisionFilter create(TokenStream input) {
|
||||
assureMatchVersion();
|
||||
return articles == null ? new ElisionFilter(luceneMatchVersion,input) :
|
||||
new ElisionFilter(luceneMatchVersion,input,articles);
|
||||
return new ElisionFilter(input, articles);
|
||||
}
|
||||
}
|
||||
|
|
@ -0,0 +1,94 @@
|
|||
package org.apache.lucene.analysis.util;
|
||||
|
||||
/*
|
||||
* Licensed to the Apache Software Foundation (ASF) under one or more
|
||||
* contributor license agreements. See the NOTICE file distributed with
|
||||
* this work for additional information regarding copyright ownership.
|
||||
* The ASF licenses this file to You under the Apache License, Version 2.0
|
||||
* (the "License"); you may not use this file except in compliance with
|
||||
* the License. You may obtain a copy of the License at
|
||||
*
|
||||
* http://www.apache.org/licenses/LICENSE-2.0
|
||||
*
|
||||
* Unless required by applicable law or agreed to in writing, software
|
||||
* distributed under the License is distributed on an "AS IS" BASIS,
|
||||
* WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
||||
* See the License for the specific language governing permissions and
|
||||
* limitations under the License.
|
||||
*/
|
||||
|
||||
import java.io.File;
|
||||
import java.io.FileInputStream;
|
||||
import java.io.FileNotFoundException;
|
||||
import java.io.IOException;
|
||||
import java.io.InputStream;
|
||||
|
||||
/**
|
||||
* Simple {@link ResourceLoader} that opens resource files
|
||||
* from the local file system, optionally resolving against
|
||||
* a base directory.
|
||||
*
|
||||
* <p>This loader wraps a delegate {@link ResourceLoader}
|
||||
* that is used to resolve all files that the current base directory
|
||||
* does not contain. {@link #newInstance} is always resolved
|
||||
* against the delegate, as a {@link ClassLoader} is needed.
|
||||
*
|
||||
* <p>You can chain several {@code FilesystemResourceLoader}s
|
||||
* to allow lookup of files in more than one base directory.
|
||||
*/
|
||||
public final class FilesystemResourceLoader implements ResourceLoader {
|
||||
private final File baseDirectory;
|
||||
private final ResourceLoader delegate;
|
||||
|
||||
/**
|
||||
* Creates a resource loader that requires absolute filenames or filenames relative to CWD
|
||||
* to resolve resources. Files not found in file system and class lookups
|
||||
* are delegated to context classloader.
|
||||
*/
|
||||
public FilesystemResourceLoader() {
|
||||
this((File) null);
|
||||
}
|
||||
|
||||
/**
|
||||
* Creates a resource loader that resolves resources against the given
|
||||
* base directory (may be {@code null} to refer to CWD).
|
||||
* Files not found in file system and class lookups are delegated to context
|
||||
* classloader.
|
||||
*/
|
||||
public FilesystemResourceLoader(File baseDirectory) {
|
||||
this(baseDirectory, new ClasspathResourceLoader());
|
||||
}
|
||||
|
||||
/**
|
||||
* Creates a resource loader that resolves resources against the given
|
||||
* base directory (may be {@code null} to refer to CWD).
|
||||
* Files not found in file system and class lookups are delegated
|
||||
* to the given delegate {@link ResourceLoader}.
|
||||
*/
|
||||
public FilesystemResourceLoader(File baseDirectory, ResourceLoader delegate) {
|
||||
if (baseDirectory != null && !baseDirectory.isDirectory())
|
||||
throw new IllegalArgumentException("baseDirectory is not a directory or null");
|
||||
if (delegate == null)
|
||||
throw new IllegalArgumentException("delegate ResourceLoader may not be null");
|
||||
this.baseDirectory = baseDirectory;
|
||||
this.delegate = delegate;
|
||||
}
|
||||
|
||||
@Override
|
||||
public InputStream openResource(String resource) throws IOException {
|
||||
try {
|
||||
File file = new File (resource);
|
||||
if (baseDirectory != null && !file.isAbsolute()) {
|
||||
file = new File(baseDirectory, resource);
|
||||
}
|
||||
return new FileInputStream(file);
|
||||
} catch (FileNotFoundException fnfe) {
|
||||
return delegate.openResource(resource);
|
||||
}
|
||||
}
|
||||
|
||||
@Override
|
||||
public <T> T newInstance(String cname, Class<T> expectedType) {
|
||||
return delegate.newInstance(cname, expectedType);
|
||||
}
|
||||
}
|
|
@ -1,4 +1,4 @@
|
|||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 7/15/12 1:57 AM */
|
||||
/* The following code was generated by JFlex 1.5.0-SNAPSHOT on 8/6/12 11:57 AM */
|
||||
|
||||
package org.apache.lucene.analysis.wikipedia;
|
||||
|
||||
|
@ -25,8 +25,8 @@ import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
|||
/**
|
||||
* This class is a scanner generated by
|
||||
* <a href="http://www.jflex.de/">JFlex</a> 1.5.0-SNAPSHOT
|
||||
* on 7/15/12 1:57 AM from the specification file
|
||||
* <tt>C:/cygwin/home/s/svn/lucene/dev/trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/wikipedia/WikipediaTokenizerImpl.jflex</tt>
|
||||
* on 8/6/12 11:57 AM from the specification file
|
||||
* <tt>/home/rmuir/workspace/lucene-trunk/lucene/analysis/common/src/java/org/apache/lucene/analysis/wikipedia/WikipediaTokenizerImpl.jflex</tt>
|
||||
*/
|
||||
class WikipediaTokenizerImpl {
|
||||
|
||||
|
@ -34,7 +34,7 @@ class WikipediaTokenizerImpl {
|
|||
public static final int YYEOF = -1;
|
||||
|
||||
/** initial size of the lookahead buffer */
|
||||
private static final int ZZ_BUFFERSIZE = 16384;
|
||||
private static final int ZZ_BUFFERSIZE = 4096;
|
||||
|
||||
/** lexical states */
|
||||
public static final int THREE_SINGLE_QUOTES_STATE = 10;
|
||||
|
|
|
@ -27,6 +27,7 @@ import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
|||
%function getNextToken
|
||||
%pack
|
||||
%char
|
||||
%buffer 4096
|
||||
|
||||
%{
|
||||
|
||||
|
|
|
@ -1,62 +1,69 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler.
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class DanishStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "hed", -1, 1, "", this),
|
||||
new Among ( "ethed", 0, 1, "", this),
|
||||
new Among ( "ered", -1, 1, "", this),
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "erede", 3, 1, "", this),
|
||||
new Among ( "ende", 3, 1, "", this),
|
||||
new Among ( "erende", 5, 1, "", this),
|
||||
new Among ( "ene", 3, 1, "", this),
|
||||
new Among ( "erne", 3, 1, "", this),
|
||||
new Among ( "ere", 3, 1, "", this),
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "heden", 10, 1, "", this),
|
||||
new Among ( "eren", 10, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "heder", 13, 1, "", this),
|
||||
new Among ( "erer", 13, 1, "", this),
|
||||
new Among ( "s", -1, 2, "", this),
|
||||
new Among ( "heds", 16, 1, "", this),
|
||||
new Among ( "es", 16, 1, "", this),
|
||||
new Among ( "endes", 18, 1, "", this),
|
||||
new Among ( "erendes", 19, 1, "", this),
|
||||
new Among ( "enes", 18, 1, "", this),
|
||||
new Among ( "ernes", 18, 1, "", this),
|
||||
new Among ( "eres", 18, 1, "", this),
|
||||
new Among ( "ens", 16, 1, "", this),
|
||||
new Among ( "hedens", 24, 1, "", this),
|
||||
new Among ( "erens", 24, 1, "", this),
|
||||
new Among ( "ers", 16, 1, "", this),
|
||||
new Among ( "ets", 16, 1, "", this),
|
||||
new Among ( "erets", 28, 1, "", this),
|
||||
new Among ( "et", -1, 1, "", this),
|
||||
new Among ( "eret", 30, 1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static DanishStemmer methodObject = new DanishStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "hed", -1, 1, "", methodObject ),
|
||||
new Among ( "ethed", 0, 1, "", methodObject ),
|
||||
new Among ( "ered", -1, 1, "", methodObject ),
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "erede", 3, 1, "", methodObject ),
|
||||
new Among ( "ende", 3, 1, "", methodObject ),
|
||||
new Among ( "erende", 5, 1, "", methodObject ),
|
||||
new Among ( "ene", 3, 1, "", methodObject ),
|
||||
new Among ( "erne", 3, 1, "", methodObject ),
|
||||
new Among ( "ere", 3, 1, "", methodObject ),
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "heden", 10, 1, "", methodObject ),
|
||||
new Among ( "eren", 10, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "heder", 13, 1, "", methodObject ),
|
||||
new Among ( "erer", 13, 1, "", methodObject ),
|
||||
new Among ( "s", -1, 2, "", methodObject ),
|
||||
new Among ( "heds", 16, 1, "", methodObject ),
|
||||
new Among ( "es", 16, 1, "", methodObject ),
|
||||
new Among ( "endes", 18, 1, "", methodObject ),
|
||||
new Among ( "erendes", 19, 1, "", methodObject ),
|
||||
new Among ( "enes", 18, 1, "", methodObject ),
|
||||
new Among ( "ernes", 18, 1, "", methodObject ),
|
||||
new Among ( "eres", 18, 1, "", methodObject ),
|
||||
new Among ( "ens", 16, 1, "", methodObject ),
|
||||
new Among ( "hedens", 24, 1, "", methodObject ),
|
||||
new Among ( "erens", 24, 1, "", methodObject ),
|
||||
new Among ( "ers", 16, 1, "", methodObject ),
|
||||
new Among ( "ets", 16, 1, "", methodObject ),
|
||||
new Among ( "erets", 28, 1, "", methodObject ),
|
||||
new Among ( "et", -1, 1, "", methodObject ),
|
||||
new Among ( "eret", 30, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "gd", -1, -1, "", this),
|
||||
new Among ( "dt", -1, -1, "", this),
|
||||
new Among ( "gt", -1, -1, "", this),
|
||||
new Among ( "kt", -1, -1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "gd", -1, -1, "", methodObject ),
|
||||
new Among ( "dt", -1, -1, "", methodObject ),
|
||||
new Among ( "gt", -1, -1, "", methodObject ),
|
||||
new Among ( "kt", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ig", -1, 1, "", this),
|
||||
new Among ( "lig", 0, 1, "", this),
|
||||
new Among ( "elig", 1, 1, "", this),
|
||||
new Among ( "els", -1, 1, "", this),
|
||||
new Among ( "l\u00F8st", -1, 2, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ig", -1, 1, "", methodObject ),
|
||||
new Among ( "lig", 0, 1, "", methodObject ),
|
||||
new Among ( "elig", 1, 1, "", methodObject ),
|
||||
new Among ( "els", -1, 1, "", methodObject ),
|
||||
new Among ( "l\u00F8st", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 48, 0, 128 };
|
||||
|
@ -65,7 +72,7 @@ public class DanishStemmer extends SnowballProgram {
|
|||
|
||||
private int I_x;
|
||||
private int I_p1;
|
||||
private StringBuilder S_ch = new StringBuilder();
|
||||
private java.lang.StringBuilder S_ch = new java.lang.StringBuilder();
|
||||
|
||||
private void copy_from(DanishStemmer other) {
|
||||
I_x = other.I_x;
|
||||
|
@ -419,5 +426,14 @@ public class DanishStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
}
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof DanishStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return DanishStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
|
|
@ -1,62 +1,69 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler.
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class DutchStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", this),
|
||||
new Among ( "\u00E1", 0, 1, "", this),
|
||||
new Among ( "\u00E4", 0, 1, "", this),
|
||||
new Among ( "\u00E9", 0, 2, "", this),
|
||||
new Among ( "\u00EB", 0, 2, "", this),
|
||||
new Among ( "\u00ED", 0, 3, "", this),
|
||||
new Among ( "\u00EF", 0, 3, "", this),
|
||||
new Among ( "\u00F3", 0, 4, "", this),
|
||||
new Among ( "\u00F6", 0, 4, "", this),
|
||||
new Among ( "\u00FA", 0, 5, "", this),
|
||||
new Among ( "\u00FC", 0, 5, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static DutchStemmer methodObject = new DutchStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", methodObject ),
|
||||
new Among ( "\u00E1", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E4", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E9", 0, 2, "", methodObject ),
|
||||
new Among ( "\u00EB", 0, 2, "", methodObject ),
|
||||
new Among ( "\u00ED", 0, 3, "", methodObject ),
|
||||
new Among ( "\u00EF", 0, 3, "", methodObject ),
|
||||
new Among ( "\u00F3", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00F6", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00FA", 0, 5, "", methodObject ),
|
||||
new Among ( "\u00FC", 0, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "I", 0, 2, "", this),
|
||||
new Among ( "Y", 0, 1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "I", 0, 2, "", methodObject ),
|
||||
new Among ( "Y", 0, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "dd", -1, -1, "", this),
|
||||
new Among ( "kk", -1, -1, "", this),
|
||||
new Among ( "tt", -1, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "dd", -1, -1, "", methodObject ),
|
||||
new Among ( "kk", -1, -1, "", methodObject ),
|
||||
new Among ( "tt", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ene", -1, 2, "", this),
|
||||
new Among ( "se", -1, 3, "", this),
|
||||
new Among ( "en", -1, 2, "", this),
|
||||
new Among ( "heden", 2, 1, "", this),
|
||||
new Among ( "s", -1, 3, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ene", -1, 2, "", methodObject ),
|
||||
new Among ( "se", -1, 3, "", methodObject ),
|
||||
new Among ( "en", -1, 2, "", methodObject ),
|
||||
new Among ( "heden", 2, 1, "", methodObject ),
|
||||
new Among ( "s", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "end", -1, 1, "", this),
|
||||
new Among ( "ig", -1, 2, "", this),
|
||||
new Among ( "ing", -1, 1, "", this),
|
||||
new Among ( "lijk", -1, 3, "", this),
|
||||
new Among ( "baar", -1, 4, "", this),
|
||||
new Among ( "bar", -1, 5, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "end", -1, 1, "", methodObject ),
|
||||
new Among ( "ig", -1, 2, "", methodObject ),
|
||||
new Among ( "ing", -1, 1, "", methodObject ),
|
||||
new Among ( "lijk", -1, 3, "", methodObject ),
|
||||
new Among ( "baar", -1, 4, "", methodObject ),
|
||||
new Among ( "bar", -1, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "aa", -1, -1, "", this),
|
||||
new Among ( "ee", -1, -1, "", this),
|
||||
new Among ( "oo", -1, -1, "", this),
|
||||
new Among ( "uu", -1, -1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "aa", -1, -1, "", methodObject ),
|
||||
new Among ( "ee", -1, -1, "", methodObject ),
|
||||
new Among ( "oo", -1, -1, "", methodObject ),
|
||||
new Among ( "uu", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128 };
|
||||
|
@ -833,5 +840,15 @@ public class DutchStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof DutchStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return DutchStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,155 +1,162 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler.
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class EnglishStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "arsen", -1, -1, "", this),
|
||||
new Among ( "commun", -1, -1, "", this),
|
||||
new Among ( "gener", -1, -1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static EnglishStemmer methodObject = new EnglishStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "arsen", -1, -1, "", methodObject ),
|
||||
new Among ( "commun", -1, -1, "", methodObject ),
|
||||
new Among ( "gener", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "'", -1, 1, "", this),
|
||||
new Among ( "'s'", 0, 1, "", this),
|
||||
new Among ( "'s", -1, 1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "'", -1, 1, "", methodObject ),
|
||||
new Among ( "'s'", 0, 1, "", methodObject ),
|
||||
new Among ( "'s", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ied", -1, 2, "", this),
|
||||
new Among ( "s", -1, 3, "", this),
|
||||
new Among ( "ies", 1, 2, "", this),
|
||||
new Among ( "sses", 1, 1, "", this),
|
||||
new Among ( "ss", 1, -1, "", this),
|
||||
new Among ( "us", 1, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ied", -1, 2, "", methodObject ),
|
||||
new Among ( "s", -1, 3, "", methodObject ),
|
||||
new Among ( "ies", 1, 2, "", methodObject ),
|
||||
new Among ( "sses", 1, 1, "", methodObject ),
|
||||
new Among ( "ss", 1, -1, "", methodObject ),
|
||||
new Among ( "us", 1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "bb", 0, 2, "", this),
|
||||
new Among ( "dd", 0, 2, "", this),
|
||||
new Among ( "ff", 0, 2, "", this),
|
||||
new Among ( "gg", 0, 2, "", this),
|
||||
new Among ( "bl", 0, 1, "", this),
|
||||
new Among ( "mm", 0, 2, "", this),
|
||||
new Among ( "nn", 0, 2, "", this),
|
||||
new Among ( "pp", 0, 2, "", this),
|
||||
new Among ( "rr", 0, 2, "", this),
|
||||
new Among ( "at", 0, 1, "", this),
|
||||
new Among ( "tt", 0, 2, "", this),
|
||||
new Among ( "iz", 0, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "bb", 0, 2, "", methodObject ),
|
||||
new Among ( "dd", 0, 2, "", methodObject ),
|
||||
new Among ( "ff", 0, 2, "", methodObject ),
|
||||
new Among ( "gg", 0, 2, "", methodObject ),
|
||||
new Among ( "bl", 0, 1, "", methodObject ),
|
||||
new Among ( "mm", 0, 2, "", methodObject ),
|
||||
new Among ( "nn", 0, 2, "", methodObject ),
|
||||
new Among ( "pp", 0, 2, "", methodObject ),
|
||||
new Among ( "rr", 0, 2, "", methodObject ),
|
||||
new Among ( "at", 0, 1, "", methodObject ),
|
||||
new Among ( "tt", 0, 2, "", methodObject ),
|
||||
new Among ( "iz", 0, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ed", -1, 2, "", this),
|
||||
new Among ( "eed", 0, 1, "", this),
|
||||
new Among ( "ing", -1, 2, "", this),
|
||||
new Among ( "edly", -1, 2, "", this),
|
||||
new Among ( "eedly", 3, 1, "", this),
|
||||
new Among ( "ingly", -1, 2, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ed", -1, 2, "", methodObject ),
|
||||
new Among ( "eed", 0, 1, "", methodObject ),
|
||||
new Among ( "ing", -1, 2, "", methodObject ),
|
||||
new Among ( "edly", -1, 2, "", methodObject ),
|
||||
new Among ( "eedly", 3, 1, "", methodObject ),
|
||||
new Among ( "ingly", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "anci", -1, 3, "", this),
|
||||
new Among ( "enci", -1, 2, "", this),
|
||||
new Among ( "ogi", -1, 13, "", this),
|
||||
new Among ( "li", -1, 16, "", this),
|
||||
new Among ( "bli", 3, 12, "", this),
|
||||
new Among ( "abli", 4, 4, "", this),
|
||||
new Among ( "alli", 3, 8, "", this),
|
||||
new Among ( "fulli", 3, 14, "", this),
|
||||
new Among ( "lessli", 3, 15, "", this),
|
||||
new Among ( "ousli", 3, 10, "", this),
|
||||
new Among ( "entli", 3, 5, "", this),
|
||||
new Among ( "aliti", -1, 8, "", this),
|
||||
new Among ( "biliti", -1, 12, "", this),
|
||||
new Among ( "iviti", -1, 11, "", this),
|
||||
new Among ( "tional", -1, 1, "", this),
|
||||
new Among ( "ational", 14, 7, "", this),
|
||||
new Among ( "alism", -1, 8, "", this),
|
||||
new Among ( "ation", -1, 7, "", this),
|
||||
new Among ( "ization", 17, 6, "", this),
|
||||
new Among ( "izer", -1, 6, "", this),
|
||||
new Among ( "ator", -1, 7, "", this),
|
||||
new Among ( "iveness", -1, 11, "", this),
|
||||
new Among ( "fulness", -1, 9, "", this),
|
||||
new Among ( "ousness", -1, 10, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "anci", -1, 3, "", methodObject ),
|
||||
new Among ( "enci", -1, 2, "", methodObject ),
|
||||
new Among ( "ogi", -1, 13, "", methodObject ),
|
||||
new Among ( "li", -1, 16, "", methodObject ),
|
||||
new Among ( "bli", 3, 12, "", methodObject ),
|
||||
new Among ( "abli", 4, 4, "", methodObject ),
|
||||
new Among ( "alli", 3, 8, "", methodObject ),
|
||||
new Among ( "fulli", 3, 14, "", methodObject ),
|
||||
new Among ( "lessli", 3, 15, "", methodObject ),
|
||||
new Among ( "ousli", 3, 10, "", methodObject ),
|
||||
new Among ( "entli", 3, 5, "", methodObject ),
|
||||
new Among ( "aliti", -1, 8, "", methodObject ),
|
||||
new Among ( "biliti", -1, 12, "", methodObject ),
|
||||
new Among ( "iviti", -1, 11, "", methodObject ),
|
||||
new Among ( "tional", -1, 1, "", methodObject ),
|
||||
new Among ( "ational", 14, 7, "", methodObject ),
|
||||
new Among ( "alism", -1, 8, "", methodObject ),
|
||||
new Among ( "ation", -1, 7, "", methodObject ),
|
||||
new Among ( "ization", 17, 6, "", methodObject ),
|
||||
new Among ( "izer", -1, 6, "", methodObject ),
|
||||
new Among ( "ator", -1, 7, "", methodObject ),
|
||||
new Among ( "iveness", -1, 11, "", methodObject ),
|
||||
new Among ( "fulness", -1, 9, "", methodObject ),
|
||||
new Among ( "ousness", -1, 10, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "icate", -1, 4, "", this),
|
||||
new Among ( "ative", -1, 6, "", this),
|
||||
new Among ( "alize", -1, 3, "", this),
|
||||
new Among ( "iciti", -1, 4, "", this),
|
||||
new Among ( "ical", -1, 4, "", this),
|
||||
new Among ( "tional", -1, 1, "", this),
|
||||
new Among ( "ational", 5, 2, "", this),
|
||||
new Among ( "ful", -1, 5, "", this),
|
||||
new Among ( "ness", -1, 5, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "icate", -1, 4, "", methodObject ),
|
||||
new Among ( "ative", -1, 6, "", methodObject ),
|
||||
new Among ( "alize", -1, 3, "", methodObject ),
|
||||
new Among ( "iciti", -1, 4, "", methodObject ),
|
||||
new Among ( "ical", -1, 4, "", methodObject ),
|
||||
new Among ( "tional", -1, 1, "", methodObject ),
|
||||
new Among ( "ational", 5, 2, "", methodObject ),
|
||||
new Among ( "ful", -1, 5, "", methodObject ),
|
||||
new Among ( "ness", -1, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "ic", -1, 1, "", this),
|
||||
new Among ( "ance", -1, 1, "", this),
|
||||
new Among ( "ence", -1, 1, "", this),
|
||||
new Among ( "able", -1, 1, "", this),
|
||||
new Among ( "ible", -1, 1, "", this),
|
||||
new Among ( "ate", -1, 1, "", this),
|
||||
new Among ( "ive", -1, 1, "", this),
|
||||
new Among ( "ize", -1, 1, "", this),
|
||||
new Among ( "iti", -1, 1, "", this),
|
||||
new Among ( "al", -1, 1, "", this),
|
||||
new Among ( "ism", -1, 1, "", this),
|
||||
new Among ( "ion", -1, 2, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "ous", -1, 1, "", this),
|
||||
new Among ( "ant", -1, 1, "", this),
|
||||
new Among ( "ent", -1, 1, "", this),
|
||||
new Among ( "ment", 15, 1, "", this),
|
||||
new Among ( "ement", 16, 1, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "ic", -1, 1, "", methodObject ),
|
||||
new Among ( "ance", -1, 1, "", methodObject ),
|
||||
new Among ( "ence", -1, 1, "", methodObject ),
|
||||
new Among ( "able", -1, 1, "", methodObject ),
|
||||
new Among ( "ible", -1, 1, "", methodObject ),
|
||||
new Among ( "ate", -1, 1, "", methodObject ),
|
||||
new Among ( "ive", -1, 1, "", methodObject ),
|
||||
new Among ( "ize", -1, 1, "", methodObject ),
|
||||
new Among ( "iti", -1, 1, "", methodObject ),
|
||||
new Among ( "al", -1, 1, "", methodObject ),
|
||||
new Among ( "ism", -1, 1, "", methodObject ),
|
||||
new Among ( "ion", -1, 2, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "ous", -1, 1, "", methodObject ),
|
||||
new Among ( "ant", -1, 1, "", methodObject ),
|
||||
new Among ( "ent", -1, 1, "", methodObject ),
|
||||
new Among ( "ment", 15, 1, "", methodObject ),
|
||||
new Among ( "ement", 16, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "l", -1, 2, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "l", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_9[] = {
|
||||
new Among ( "succeed", -1, -1, "", this),
|
||||
new Among ( "proceed", -1, -1, "", this),
|
||||
new Among ( "exceed", -1, -1, "", this),
|
||||
new Among ( "canning", -1, -1, "", this),
|
||||
new Among ( "inning", -1, -1, "", this),
|
||||
new Among ( "earring", -1, -1, "", this),
|
||||
new Among ( "herring", -1, -1, "", this),
|
||||
new Among ( "outing", -1, -1, "", this)
|
||||
private final static Among a_9[] = {
|
||||
new Among ( "succeed", -1, -1, "", methodObject ),
|
||||
new Among ( "proceed", -1, -1, "", methodObject ),
|
||||
new Among ( "exceed", -1, -1, "", methodObject ),
|
||||
new Among ( "canning", -1, -1, "", methodObject ),
|
||||
new Among ( "inning", -1, -1, "", methodObject ),
|
||||
new Among ( "earring", -1, -1, "", methodObject ),
|
||||
new Among ( "herring", -1, -1, "", methodObject ),
|
||||
new Among ( "outing", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_10[] = {
|
||||
new Among ( "andes", -1, -1, "", this),
|
||||
new Among ( "atlas", -1, -1, "", this),
|
||||
new Among ( "bias", -1, -1, "", this),
|
||||
new Among ( "cosmos", -1, -1, "", this),
|
||||
new Among ( "dying", -1, 3, "", this),
|
||||
new Among ( "early", -1, 9, "", this),
|
||||
new Among ( "gently", -1, 7, "", this),
|
||||
new Among ( "howe", -1, -1, "", this),
|
||||
new Among ( "idly", -1, 6, "", this),
|
||||
new Among ( "lying", -1, 4, "", this),
|
||||
new Among ( "news", -1, -1, "", this),
|
||||
new Among ( "only", -1, 10, "", this),
|
||||
new Among ( "singly", -1, 11, "", this),
|
||||
new Among ( "skies", -1, 2, "", this),
|
||||
new Among ( "skis", -1, 1, "", this),
|
||||
new Among ( "sky", -1, -1, "", this),
|
||||
new Among ( "tying", -1, 5, "", this),
|
||||
new Among ( "ugly", -1, 8, "", this)
|
||||
private final static Among a_10[] = {
|
||||
new Among ( "andes", -1, -1, "", methodObject ),
|
||||
new Among ( "atlas", -1, -1, "", methodObject ),
|
||||
new Among ( "bias", -1, -1, "", methodObject ),
|
||||
new Among ( "cosmos", -1, -1, "", methodObject ),
|
||||
new Among ( "dying", -1, 3, "", methodObject ),
|
||||
new Among ( "early", -1, 9, "", methodObject ),
|
||||
new Among ( "gently", -1, 7, "", methodObject ),
|
||||
new Among ( "howe", -1, -1, "", methodObject ),
|
||||
new Among ( "idly", -1, 6, "", methodObject ),
|
||||
new Among ( "lying", -1, 4, "", methodObject ),
|
||||
new Among ( "news", -1, -1, "", methodObject ),
|
||||
new Among ( "only", -1, 10, "", methodObject ),
|
||||
new Among ( "singly", -1, 11, "", methodObject ),
|
||||
new Among ( "skies", -1, 2, "", methodObject ),
|
||||
new Among ( "skis", -1, 1, "", methodObject ),
|
||||
new Among ( "sky", -1, -1, "", methodObject ),
|
||||
new Among ( "tying", -1, 5, "", methodObject ),
|
||||
new Among ( "ugly", -1, 8, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1 };
|
||||
|
@ -1310,5 +1317,15 @@ public class EnglishStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof EnglishStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return EnglishStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,130 +1,137 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler.
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class FinnishStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "pa", -1, 1, "", this),
|
||||
new Among ( "sti", -1, 2, "", this),
|
||||
new Among ( "kaan", -1, 1, "", this),
|
||||
new Among ( "han", -1, 1, "", this),
|
||||
new Among ( "kin", -1, 1, "", this),
|
||||
new Among ( "h\u00E4n", -1, 1, "", this),
|
||||
new Among ( "k\u00E4\u00E4n", -1, 1, "", this),
|
||||
new Among ( "ko", -1, 1, "", this),
|
||||
new Among ( "p\u00E4", -1, 1, "", this),
|
||||
new Among ( "k\u00F6", -1, 1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static FinnishStemmer methodObject = new FinnishStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "pa", -1, 1, "", methodObject ),
|
||||
new Among ( "sti", -1, 2, "", methodObject ),
|
||||
new Among ( "kaan", -1, 1, "", methodObject ),
|
||||
new Among ( "han", -1, 1, "", methodObject ),
|
||||
new Among ( "kin", -1, 1, "", methodObject ),
|
||||
new Among ( "h\u00E4n", -1, 1, "", methodObject ),
|
||||
new Among ( "k\u00E4\u00E4n", -1, 1, "", methodObject ),
|
||||
new Among ( "ko", -1, 1, "", methodObject ),
|
||||
new Among ( "p\u00E4", -1, 1, "", methodObject ),
|
||||
new Among ( "k\u00F6", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "lla", -1, -1, "", this),
|
||||
new Among ( "na", -1, -1, "", this),
|
||||
new Among ( "ssa", -1, -1, "", this),
|
||||
new Among ( "ta", -1, -1, "", this),
|
||||
new Among ( "lta", 3, -1, "", this),
|
||||
new Among ( "sta", 3, -1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "lla", -1, -1, "", methodObject ),
|
||||
new Among ( "na", -1, -1, "", methodObject ),
|
||||
new Among ( "ssa", -1, -1, "", methodObject ),
|
||||
new Among ( "ta", -1, -1, "", methodObject ),
|
||||
new Among ( "lta", 3, -1, "", methodObject ),
|
||||
new Among ( "sta", 3, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ll\u00E4", -1, -1, "", this),
|
||||
new Among ( "n\u00E4", -1, -1, "", this),
|
||||
new Among ( "ss\u00E4", -1, -1, "", this),
|
||||
new Among ( "t\u00E4", -1, -1, "", this),
|
||||
new Among ( "lt\u00E4", 3, -1, "", this),
|
||||
new Among ( "st\u00E4", 3, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ll\u00E4", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u00E4", -1, -1, "", methodObject ),
|
||||
new Among ( "ss\u00E4", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00E4", -1, -1, "", methodObject ),
|
||||
new Among ( "lt\u00E4", 3, -1, "", methodObject ),
|
||||
new Among ( "st\u00E4", 3, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "lle", -1, -1, "", this),
|
||||
new Among ( "ine", -1, -1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "lle", -1, -1, "", methodObject ),
|
||||
new Among ( "ine", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "nsa", -1, 3, "", this),
|
||||
new Among ( "mme", -1, 3, "", this),
|
||||
new Among ( "nne", -1, 3, "", this),
|
||||
new Among ( "ni", -1, 2, "", this),
|
||||
new Among ( "si", -1, 1, "", this),
|
||||
new Among ( "an", -1, 4, "", this),
|
||||
new Among ( "en", -1, 6, "", this),
|
||||
new Among ( "\u00E4n", -1, 5, "", this),
|
||||
new Among ( "ns\u00E4", -1, 3, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "nsa", -1, 3, "", methodObject ),
|
||||
new Among ( "mme", -1, 3, "", methodObject ),
|
||||
new Among ( "nne", -1, 3, "", methodObject ),
|
||||
new Among ( "ni", -1, 2, "", methodObject ),
|
||||
new Among ( "si", -1, 1, "", methodObject ),
|
||||
new Among ( "an", -1, 4, "", methodObject ),
|
||||
new Among ( "en", -1, 6, "", methodObject ),
|
||||
new Among ( "\u00E4n", -1, 5, "", methodObject ),
|
||||
new Among ( "ns\u00E4", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "aa", -1, -1, "", this),
|
||||
new Among ( "ee", -1, -1, "", this),
|
||||
new Among ( "ii", -1, -1, "", this),
|
||||
new Among ( "oo", -1, -1, "", this),
|
||||
new Among ( "uu", -1, -1, "", this),
|
||||
new Among ( "\u00E4\u00E4", -1, -1, "", this),
|
||||
new Among ( "\u00F6\u00F6", -1, -1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "aa", -1, -1, "", methodObject ),
|
||||
new Among ( "ee", -1, -1, "", methodObject ),
|
||||
new Among ( "ii", -1, -1, "", methodObject ),
|
||||
new Among ( "oo", -1, -1, "", methodObject ),
|
||||
new Among ( "uu", -1, -1, "", methodObject ),
|
||||
new Among ( "\u00E4\u00E4", -1, -1, "", methodObject ),
|
||||
new Among ( "\u00F6\u00F6", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "a", -1, 8, "", this),
|
||||
new Among ( "lla", 0, -1, "", this),
|
||||
new Among ( "na", 0, -1, "", this),
|
||||
new Among ( "ssa", 0, -1, "", this),
|
||||
new Among ( "ta", 0, -1, "", this),
|
||||
new Among ( "lta", 4, -1, "", this),
|
||||
new Among ( "sta", 4, -1, "", this),
|
||||
new Among ( "tta", 4, 9, "", this),
|
||||
new Among ( "lle", -1, -1, "", this),
|
||||
new Among ( "ine", -1, -1, "", this),
|
||||
new Among ( "ksi", -1, -1, "", this),
|
||||
new Among ( "n", -1, 7, "", this),
|
||||
new Among ( "han", 11, 1, "", this),
|
||||
new Among ( "den", 11, -1, "r_VI", this),
|
||||
new Among ( "seen", 11, -1, "r_LONG", this),
|
||||
new Among ( "hen", 11, 2, "", this),
|
||||
new Among ( "tten", 11, -1, "r_VI", this),
|
||||
new Among ( "hin", 11, 3, "", this),
|
||||
new Among ( "siin", 11, -1, "r_VI", this),
|
||||
new Among ( "hon", 11, 4, "", this),
|
||||
new Among ( "h\u00E4n", 11, 5, "", this),
|
||||
new Among ( "h\u00F6n", 11, 6, "", this),
|
||||
new Among ( "\u00E4", -1, 8, "", this),
|
||||
new Among ( "ll\u00E4", 22, -1, "", this),
|
||||
new Among ( "n\u00E4", 22, -1, "", this),
|
||||
new Among ( "ss\u00E4", 22, -1, "", this),
|
||||
new Among ( "t\u00E4", 22, -1, "", this),
|
||||
new Among ( "lt\u00E4", 26, -1, "", this),
|
||||
new Among ( "st\u00E4", 26, -1, "", this),
|
||||
new Among ( "tt\u00E4", 26, 9, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "a", -1, 8, "", methodObject ),
|
||||
new Among ( "lla", 0, -1, "", methodObject ),
|
||||
new Among ( "na", 0, -1, "", methodObject ),
|
||||
new Among ( "ssa", 0, -1, "", methodObject ),
|
||||
new Among ( "ta", 0, -1, "", methodObject ),
|
||||
new Among ( "lta", 4, -1, "", methodObject ),
|
||||
new Among ( "sta", 4, -1, "", methodObject ),
|
||||
new Among ( "tta", 4, 9, "", methodObject ),
|
||||
new Among ( "lle", -1, -1, "", methodObject ),
|
||||
new Among ( "ine", -1, -1, "", methodObject ),
|
||||
new Among ( "ksi", -1, -1, "", methodObject ),
|
||||
new Among ( "n", -1, 7, "", methodObject ),
|
||||
new Among ( "han", 11, 1, "", methodObject ),
|
||||
new Among ( "den", 11, -1, "r_VI", methodObject ),
|
||||
new Among ( "seen", 11, -1, "r_LONG", methodObject ),
|
||||
new Among ( "hen", 11, 2, "", methodObject ),
|
||||
new Among ( "tten", 11, -1, "r_VI", methodObject ),
|
||||
new Among ( "hin", 11, 3, "", methodObject ),
|
||||
new Among ( "siin", 11, -1, "r_VI", methodObject ),
|
||||
new Among ( "hon", 11, 4, "", methodObject ),
|
||||
new Among ( "h\u00E4n", 11, 5, "", methodObject ),
|
||||
new Among ( "h\u00F6n", 11, 6, "", methodObject ),
|
||||
new Among ( "\u00E4", -1, 8, "", methodObject ),
|
||||
new Among ( "ll\u00E4", 22, -1, "", methodObject ),
|
||||
new Among ( "n\u00E4", 22, -1, "", methodObject ),
|
||||
new Among ( "ss\u00E4", 22, -1, "", methodObject ),
|
||||
new Among ( "t\u00E4", 22, -1, "", methodObject ),
|
||||
new Among ( "lt\u00E4", 26, -1, "", methodObject ),
|
||||
new Among ( "st\u00E4", 26, -1, "", methodObject ),
|
||||
new Among ( "tt\u00E4", 26, 9, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "eja", -1, -1, "", this),
|
||||
new Among ( "mma", -1, 1, "", this),
|
||||
new Among ( "imma", 1, -1, "", this),
|
||||
new Among ( "mpa", -1, 1, "", this),
|
||||
new Among ( "impa", 3, -1, "", this),
|
||||
new Among ( "mmi", -1, 1, "", this),
|
||||
new Among ( "immi", 5, -1, "", this),
|
||||
new Among ( "mpi", -1, 1, "", this),
|
||||
new Among ( "impi", 7, -1, "", this),
|
||||
new Among ( "ej\u00E4", -1, -1, "", this),
|
||||
new Among ( "mm\u00E4", -1, 1, "", this),
|
||||
new Among ( "imm\u00E4", 10, -1, "", this),
|
||||
new Among ( "mp\u00E4", -1, 1, "", this),
|
||||
new Among ( "imp\u00E4", 12, -1, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "eja", -1, -1, "", methodObject ),
|
||||
new Among ( "mma", -1, 1, "", methodObject ),
|
||||
new Among ( "imma", 1, -1, "", methodObject ),
|
||||
new Among ( "mpa", -1, 1, "", methodObject ),
|
||||
new Among ( "impa", 3, -1, "", methodObject ),
|
||||
new Among ( "mmi", -1, 1, "", methodObject ),
|
||||
new Among ( "immi", 5, -1, "", methodObject ),
|
||||
new Among ( "mpi", -1, 1, "", methodObject ),
|
||||
new Among ( "impi", 7, -1, "", methodObject ),
|
||||
new Among ( "ej\u00E4", -1, -1, "", methodObject ),
|
||||
new Among ( "mm\u00E4", -1, 1, "", methodObject ),
|
||||
new Among ( "imm\u00E4", 10, -1, "", methodObject ),
|
||||
new Among ( "mp\u00E4", -1, 1, "", methodObject ),
|
||||
new Among ( "imp\u00E4", 12, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "i", -1, -1, "", this),
|
||||
new Among ( "j", -1, -1, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "i", -1, -1, "", methodObject ),
|
||||
new Among ( "j", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_9[] = {
|
||||
new Among ( "mma", -1, 1, "", this),
|
||||
new Among ( "imma", 0, -1, "", this)
|
||||
private final static Among a_9[] = {
|
||||
new Among ( "mma", -1, 1, "", methodObject ),
|
||||
new Among ( "imma", 0, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_AEI[] = {17, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8 };
|
||||
|
@ -136,7 +143,7 @@ public class FinnishStemmer extends SnowballProgram {
|
|||
private static final char g_particle_end[] = {17, 97, 24, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32 };
|
||||
|
||||
private boolean B_ending_removed;
|
||||
private StringBuilder S_x = new StringBuilder();
|
||||
private java.lang.StringBuilder S_x = new java.lang.StringBuilder();
|
||||
private int I_p2;
|
||||
private int I_p1;
|
||||
|
||||
|
@ -1030,5 +1037,15 @@ public class FinnishStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof FinnishStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return FinnishStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,183 +1,190 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class FrenchStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "col", -1, -1, "", this),
|
||||
new Among ( "par", -1, -1, "", this),
|
||||
new Among ( "tap", -1, -1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static FrenchStemmer methodObject = new FrenchStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "col", -1, -1, "", methodObject ),
|
||||
new Among ( "par", -1, -1, "", methodObject ),
|
||||
new Among ( "tap", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "", -1, 4, "", this),
|
||||
new Among ( "I", 0, 1, "", this),
|
||||
new Among ( "U", 0, 2, "", this),
|
||||
new Among ( "Y", 0, 3, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "", -1, 4, "", methodObject ),
|
||||
new Among ( "I", 0, 1, "", methodObject ),
|
||||
new Among ( "U", 0, 2, "", methodObject ),
|
||||
new Among ( "Y", 0, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "iqU", -1, 3, "", this),
|
||||
new Among ( "abl", -1, 3, "", this),
|
||||
new Among ( "I\u00E8r", -1, 4, "", this),
|
||||
new Among ( "i\u00E8r", -1, 4, "", this),
|
||||
new Among ( "eus", -1, 2, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "iqU", -1, 3, "", methodObject ),
|
||||
new Among ( "abl", -1, 3, "", methodObject ),
|
||||
new Among ( "I\u00E8r", -1, 4, "", methodObject ),
|
||||
new Among ( "i\u00E8r", -1, 4, "", methodObject ),
|
||||
new Among ( "eus", -1, 2, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ic", -1, 2, "", this),
|
||||
new Among ( "abil", -1, 1, "", this),
|
||||
new Among ( "iv", -1, 3, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ic", -1, 2, "", methodObject ),
|
||||
new Among ( "abil", -1, 1, "", methodObject ),
|
||||
new Among ( "iv", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "iqUe", -1, 1, "", this),
|
||||
new Among ( "atrice", -1, 2, "", this),
|
||||
new Among ( "ance", -1, 1, "", this),
|
||||
new Among ( "ence", -1, 5, "", this),
|
||||
new Among ( "logie", -1, 3, "", this),
|
||||
new Among ( "able", -1, 1, "", this),
|
||||
new Among ( "isme", -1, 1, "", this),
|
||||
new Among ( "euse", -1, 11, "", this),
|
||||
new Among ( "iste", -1, 1, "", this),
|
||||
new Among ( "ive", -1, 8, "", this),
|
||||
new Among ( "if", -1, 8, "", this),
|
||||
new Among ( "usion", -1, 4, "", this),
|
||||
new Among ( "ation", -1, 2, "", this),
|
||||
new Among ( "ution", -1, 4, "", this),
|
||||
new Among ( "ateur", -1, 2, "", this),
|
||||
new Among ( "iqUes", -1, 1, "", this),
|
||||
new Among ( "atrices", -1, 2, "", this),
|
||||
new Among ( "ances", -1, 1, "", this),
|
||||
new Among ( "ences", -1, 5, "", this),
|
||||
new Among ( "logies", -1, 3, "", this),
|
||||
new Among ( "ables", -1, 1, "", this),
|
||||
new Among ( "ismes", -1, 1, "", this),
|
||||
new Among ( "euses", -1, 11, "", this),
|
||||
new Among ( "istes", -1, 1, "", this),
|
||||
new Among ( "ives", -1, 8, "", this),
|
||||
new Among ( "ifs", -1, 8, "", this),
|
||||
new Among ( "usions", -1, 4, "", this),
|
||||
new Among ( "ations", -1, 2, "", this),
|
||||
new Among ( "utions", -1, 4, "", this),
|
||||
new Among ( "ateurs", -1, 2, "", this),
|
||||
new Among ( "ments", -1, 15, "", this),
|
||||
new Among ( "ements", 30, 6, "", this),
|
||||
new Among ( "issements", 31, 12, "", this),
|
||||
new Among ( "it\u00E9s", -1, 7, "", this),
|
||||
new Among ( "ment", -1, 15, "", this),
|
||||
new Among ( "ement", 34, 6, "", this),
|
||||
new Among ( "issement", 35, 12, "", this),
|
||||
new Among ( "amment", 34, 13, "", this),
|
||||
new Among ( "emment", 34, 14, "", this),
|
||||
new Among ( "aux", -1, 10, "", this),
|
||||
new Among ( "eaux", 39, 9, "", this),
|
||||
new Among ( "eux", -1, 1, "", this),
|
||||
new Among ( "it\u00E9", -1, 7, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "iqUe", -1, 1, "", methodObject ),
|
||||
new Among ( "atrice", -1, 2, "", methodObject ),
|
||||
new Among ( "ance", -1, 1, "", methodObject ),
|
||||
new Among ( "ence", -1, 5, "", methodObject ),
|
||||
new Among ( "logie", -1, 3, "", methodObject ),
|
||||
new Among ( "able", -1, 1, "", methodObject ),
|
||||
new Among ( "isme", -1, 1, "", methodObject ),
|
||||
new Among ( "euse", -1, 11, "", methodObject ),
|
||||
new Among ( "iste", -1, 1, "", methodObject ),
|
||||
new Among ( "ive", -1, 8, "", methodObject ),
|
||||
new Among ( "if", -1, 8, "", methodObject ),
|
||||
new Among ( "usion", -1, 4, "", methodObject ),
|
||||
new Among ( "ation", -1, 2, "", methodObject ),
|
||||
new Among ( "ution", -1, 4, "", methodObject ),
|
||||
new Among ( "ateur", -1, 2, "", methodObject ),
|
||||
new Among ( "iqUes", -1, 1, "", methodObject ),
|
||||
new Among ( "atrices", -1, 2, "", methodObject ),
|
||||
new Among ( "ances", -1, 1, "", methodObject ),
|
||||
new Among ( "ences", -1, 5, "", methodObject ),
|
||||
new Among ( "logies", -1, 3, "", methodObject ),
|
||||
new Among ( "ables", -1, 1, "", methodObject ),
|
||||
new Among ( "ismes", -1, 1, "", methodObject ),
|
||||
new Among ( "euses", -1, 11, "", methodObject ),
|
||||
new Among ( "istes", -1, 1, "", methodObject ),
|
||||
new Among ( "ives", -1, 8, "", methodObject ),
|
||||
new Among ( "ifs", -1, 8, "", methodObject ),
|
||||
new Among ( "usions", -1, 4, "", methodObject ),
|
||||
new Among ( "ations", -1, 2, "", methodObject ),
|
||||
new Among ( "utions", -1, 4, "", methodObject ),
|
||||
new Among ( "ateurs", -1, 2, "", methodObject ),
|
||||
new Among ( "ments", -1, 15, "", methodObject ),
|
||||
new Among ( "ements", 30, 6, "", methodObject ),
|
||||
new Among ( "issements", 31, 12, "", methodObject ),
|
||||
new Among ( "it\u00E9s", -1, 7, "", methodObject ),
|
||||
new Among ( "ment", -1, 15, "", methodObject ),
|
||||
new Among ( "ement", 34, 6, "", methodObject ),
|
||||
new Among ( "issement", 35, 12, "", methodObject ),
|
||||
new Among ( "amment", 34, 13, "", methodObject ),
|
||||
new Among ( "emment", 34, 14, "", methodObject ),
|
||||
new Among ( "aux", -1, 10, "", methodObject ),
|
||||
new Among ( "eaux", 39, 9, "", methodObject ),
|
||||
new Among ( "eux", -1, 1, "", methodObject ),
|
||||
new Among ( "it\u00E9", -1, 7, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "ira", -1, 1, "", this),
|
||||
new Among ( "ie", -1, 1, "", this),
|
||||
new Among ( "isse", -1, 1, "", this),
|
||||
new Among ( "issante", -1, 1, "", this),
|
||||
new Among ( "i", -1, 1, "", this),
|
||||
new Among ( "irai", 4, 1, "", this),
|
||||
new Among ( "ir", -1, 1, "", this),
|
||||
new Among ( "iras", -1, 1, "", this),
|
||||
new Among ( "ies", -1, 1, "", this),
|
||||
new Among ( "\u00EEmes", -1, 1, "", this),
|
||||
new Among ( "isses", -1, 1, "", this),
|
||||
new Among ( "issantes", -1, 1, "", this),
|
||||
new Among ( "\u00EEtes", -1, 1, "", this),
|
||||
new Among ( "is", -1, 1, "", this),
|
||||
new Among ( "irais", 13, 1, "", this),
|
||||
new Among ( "issais", 13, 1, "", this),
|
||||
new Among ( "irions", -1, 1, "", this),
|
||||
new Among ( "issions", -1, 1, "", this),
|
||||
new Among ( "irons", -1, 1, "", this),
|
||||
new Among ( "issons", -1, 1, "", this),
|
||||
new Among ( "issants", -1, 1, "", this),
|
||||
new Among ( "it", -1, 1, "", this),
|
||||
new Among ( "irait", 21, 1, "", this),
|
||||
new Among ( "issait", 21, 1, "", this),
|
||||
new Among ( "issant", -1, 1, "", this),
|
||||
new Among ( "iraIent", -1, 1, "", this),
|
||||
new Among ( "issaIent", -1, 1, "", this),
|
||||
new Among ( "irent", -1, 1, "", this),
|
||||
new Among ( "issent", -1, 1, "", this),
|
||||
new Among ( "iront", -1, 1, "", this),
|
||||
new Among ( "\u00EEt", -1, 1, "", this),
|
||||
new Among ( "iriez", -1, 1, "", this),
|
||||
new Among ( "issiez", -1, 1, "", this),
|
||||
new Among ( "irez", -1, 1, "", this),
|
||||
new Among ( "issez", -1, 1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "ira", -1, 1, "", methodObject ),
|
||||
new Among ( "ie", -1, 1, "", methodObject ),
|
||||
new Among ( "isse", -1, 1, "", methodObject ),
|
||||
new Among ( "issante", -1, 1, "", methodObject ),
|
||||
new Among ( "i", -1, 1, "", methodObject ),
|
||||
new Among ( "irai", 4, 1, "", methodObject ),
|
||||
new Among ( "ir", -1, 1, "", methodObject ),
|
||||
new Among ( "iras", -1, 1, "", methodObject ),
|
||||
new Among ( "ies", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EEmes", -1, 1, "", methodObject ),
|
||||
new Among ( "isses", -1, 1, "", methodObject ),
|
||||
new Among ( "issantes", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EEtes", -1, 1, "", methodObject ),
|
||||
new Among ( "is", -1, 1, "", methodObject ),
|
||||
new Among ( "irais", 13, 1, "", methodObject ),
|
||||
new Among ( "issais", 13, 1, "", methodObject ),
|
||||
new Among ( "irions", -1, 1, "", methodObject ),
|
||||
new Among ( "issions", -1, 1, "", methodObject ),
|
||||
new Among ( "irons", -1, 1, "", methodObject ),
|
||||
new Among ( "issons", -1, 1, "", methodObject ),
|
||||
new Among ( "issants", -1, 1, "", methodObject ),
|
||||
new Among ( "it", -1, 1, "", methodObject ),
|
||||
new Among ( "irait", 21, 1, "", methodObject ),
|
||||
new Among ( "issait", 21, 1, "", methodObject ),
|
||||
new Among ( "issant", -1, 1, "", methodObject ),
|
||||
new Among ( "iraIent", -1, 1, "", methodObject ),
|
||||
new Among ( "issaIent", -1, 1, "", methodObject ),
|
||||
new Among ( "irent", -1, 1, "", methodObject ),
|
||||
new Among ( "issent", -1, 1, "", methodObject ),
|
||||
new Among ( "iront", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EEt", -1, 1, "", methodObject ),
|
||||
new Among ( "iriez", -1, 1, "", methodObject ),
|
||||
new Among ( "issiez", -1, 1, "", methodObject ),
|
||||
new Among ( "irez", -1, 1, "", methodObject ),
|
||||
new Among ( "issez", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "a", -1, 3, "", this),
|
||||
new Among ( "era", 0, 2, "", this),
|
||||
new Among ( "asse", -1, 3, "", this),
|
||||
new Among ( "ante", -1, 3, "", this),
|
||||
new Among ( "\u00E9e", -1, 2, "", this),
|
||||
new Among ( "ai", -1, 3, "", this),
|
||||
new Among ( "erai", 5, 2, "", this),
|
||||
new Among ( "er", -1, 2, "", this),
|
||||
new Among ( "as", -1, 3, "", this),
|
||||
new Among ( "eras", 8, 2, "", this),
|
||||
new Among ( "\u00E2mes", -1, 3, "", this),
|
||||
new Among ( "asses", -1, 3, "", this),
|
||||
new Among ( "antes", -1, 3, "", this),
|
||||
new Among ( "\u00E2tes", -1, 3, "", this),
|
||||
new Among ( "\u00E9es", -1, 2, "", this),
|
||||
new Among ( "ais", -1, 3, "", this),
|
||||
new Among ( "erais", 15, 2, "", this),
|
||||
new Among ( "ions", -1, 1, "", this),
|
||||
new Among ( "erions", 17, 2, "", this),
|
||||
new Among ( "assions", 17, 3, "", this),
|
||||
new Among ( "erons", -1, 2, "", this),
|
||||
new Among ( "ants", -1, 3, "", this),
|
||||
new Among ( "\u00E9s", -1, 2, "", this),
|
||||
new Among ( "ait", -1, 3, "", this),
|
||||
new Among ( "erait", 23, 2, "", this),
|
||||
new Among ( "ant", -1, 3, "", this),
|
||||
new Among ( "aIent", -1, 3, "", this),
|
||||
new Among ( "eraIent", 26, 2, "", this),
|
||||
new Among ( "\u00E8rent", -1, 2, "", this),
|
||||
new Among ( "assent", -1, 3, "", this),
|
||||
new Among ( "eront", -1, 2, "", this),
|
||||
new Among ( "\u00E2t", -1, 3, "", this),
|
||||
new Among ( "ez", -1, 2, "", this),
|
||||
new Among ( "iez", 32, 2, "", this),
|
||||
new Among ( "eriez", 33, 2, "", this),
|
||||
new Among ( "assiez", 33, 3, "", this),
|
||||
new Among ( "erez", 32, 2, "", this),
|
||||
new Among ( "\u00E9", -1, 2, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "a", -1, 3, "", methodObject ),
|
||||
new Among ( "era", 0, 2, "", methodObject ),
|
||||
new Among ( "asse", -1, 3, "", methodObject ),
|
||||
new Among ( "ante", -1, 3, "", methodObject ),
|
||||
new Among ( "\u00E9e", -1, 2, "", methodObject ),
|
||||
new Among ( "ai", -1, 3, "", methodObject ),
|
||||
new Among ( "erai", 5, 2, "", methodObject ),
|
||||
new Among ( "er", -1, 2, "", methodObject ),
|
||||
new Among ( "as", -1, 3, "", methodObject ),
|
||||
new Among ( "eras", 8, 2, "", methodObject ),
|
||||
new Among ( "\u00E2mes", -1, 3, "", methodObject ),
|
||||
new Among ( "asses", -1, 3, "", methodObject ),
|
||||
new Among ( "antes", -1, 3, "", methodObject ),
|
||||
new Among ( "\u00E2tes", -1, 3, "", methodObject ),
|
||||
new Among ( "\u00E9es", -1, 2, "", methodObject ),
|
||||
new Among ( "ais", -1, 3, "", methodObject ),
|
||||
new Among ( "erais", 15, 2, "", methodObject ),
|
||||
new Among ( "ions", -1, 1, "", methodObject ),
|
||||
new Among ( "erions", 17, 2, "", methodObject ),
|
||||
new Among ( "assions", 17, 3, "", methodObject ),
|
||||
new Among ( "erons", -1, 2, "", methodObject ),
|
||||
new Among ( "ants", -1, 3, "", methodObject ),
|
||||
new Among ( "\u00E9s", -1, 2, "", methodObject ),
|
||||
new Among ( "ait", -1, 3, "", methodObject ),
|
||||
new Among ( "erait", 23, 2, "", methodObject ),
|
||||
new Among ( "ant", -1, 3, "", methodObject ),
|
||||
new Among ( "aIent", -1, 3, "", methodObject ),
|
||||
new Among ( "eraIent", 26, 2, "", methodObject ),
|
||||
new Among ( "\u00E8rent", -1, 2, "", methodObject ),
|
||||
new Among ( "assent", -1, 3, "", methodObject ),
|
||||
new Among ( "eront", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E2t", -1, 3, "", methodObject ),
|
||||
new Among ( "ez", -1, 2, "", methodObject ),
|
||||
new Among ( "iez", 32, 2, "", methodObject ),
|
||||
new Among ( "eriez", 33, 2, "", methodObject ),
|
||||
new Among ( "assiez", 33, 3, "", methodObject ),
|
||||
new Among ( "erez", 32, 2, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "e", -1, 3, "", this),
|
||||
new Among ( "I\u00E8re", 0, 2, "", this),
|
||||
new Among ( "i\u00E8re", 0, 2, "", this),
|
||||
new Among ( "ion", -1, 1, "", this),
|
||||
new Among ( "Ier", -1, 2, "", this),
|
||||
new Among ( "ier", -1, 2, "", this),
|
||||
new Among ( "\u00EB", -1, 4, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "e", -1, 3, "", methodObject ),
|
||||
new Among ( "I\u00E8re", 0, 2, "", methodObject ),
|
||||
new Among ( "i\u00E8re", 0, 2, "", methodObject ),
|
||||
new Among ( "ion", -1, 1, "", methodObject ),
|
||||
new Among ( "Ier", -1, 2, "", methodObject ),
|
||||
new Among ( "ier", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00EB", -1, 4, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "ell", -1, -1, "", this),
|
||||
new Among ( "eill", -1, -1, "", this),
|
||||
new Among ( "enn", -1, -1, "", this),
|
||||
new Among ( "onn", -1, -1, "", this),
|
||||
new Among ( "ett", -1, -1, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "ell", -1, -1, "", methodObject ),
|
||||
new Among ( "eill", -1, -1, "", methodObject ),
|
||||
new Among ( "enn", -1, -1, "", methodObject ),
|
||||
new Among ( "onn", -1, -1, "", methodObject ),
|
||||
new Among ( "ett", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128, 130, 103, 8, 5 };
|
||||
|
@ -1497,5 +1504,15 @@ public class FrenchStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof FrenchStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return FrenchStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,63 +1,70 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class German2Stemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", this),
|
||||
new Among ( "ae", 0, 2, "", this),
|
||||
new Among ( "oe", 0, 3, "", this),
|
||||
new Among ( "qu", 0, 5, "", this),
|
||||
new Among ( "ue", 0, 4, "", this),
|
||||
new Among ( "\u00DF", 0, 1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static German2Stemmer methodObject = new German2Stemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", methodObject ),
|
||||
new Among ( "ae", 0, 2, "", methodObject ),
|
||||
new Among ( "oe", 0, 3, "", methodObject ),
|
||||
new Among ( "qu", 0, 5, "", methodObject ),
|
||||
new Among ( "ue", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00DF", 0, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "", -1, 6, "", this),
|
||||
new Among ( "U", 0, 2, "", this),
|
||||
new Among ( "Y", 0, 1, "", this),
|
||||
new Among ( "\u00E4", 0, 3, "", this),
|
||||
new Among ( "\u00F6", 0, 4, "", this),
|
||||
new Among ( "\u00FC", 0, 5, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "", -1, 6, "", methodObject ),
|
||||
new Among ( "U", 0, 2, "", methodObject ),
|
||||
new Among ( "Y", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E4", 0, 3, "", methodObject ),
|
||||
new Among ( "\u00F6", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00FC", 0, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "em", -1, 1, "", this),
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "ern", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "s", -1, 2, "", this),
|
||||
new Among ( "es", 5, 1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "em", -1, 1, "", methodObject ),
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "ern", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "s", -1, 2, "", methodObject ),
|
||||
new Among ( "es", 5, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "st", -1, 2, "", this),
|
||||
new Among ( "est", 2, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "st", -1, 2, "", methodObject ),
|
||||
new Among ( "est", 2, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ig", -1, 1, "", this),
|
||||
new Among ( "lich", -1, 1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ig", -1, 1, "", methodObject ),
|
||||
new Among ( "lich", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "end", -1, 1, "", this),
|
||||
new Among ( "ig", -1, 2, "", this),
|
||||
new Among ( "ung", -1, 1, "", this),
|
||||
new Among ( "lich", -1, 3, "", this),
|
||||
new Among ( "isch", -1, 2, "", this),
|
||||
new Among ( "ik", -1, 2, "", this),
|
||||
new Among ( "heit", -1, 3, "", this),
|
||||
new Among ( "keit", -1, 4, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "end", -1, 1, "", methodObject ),
|
||||
new Among ( "ig", -1, 2, "", methodObject ),
|
||||
new Among ( "ung", -1, 1, "", methodObject ),
|
||||
new Among ( "lich", -1, 3, "", methodObject ),
|
||||
new Among ( "isch", -1, 2, "", methodObject ),
|
||||
new Among ( "ik", -1, 2, "", methodObject ),
|
||||
new Among ( "heit", -1, 3, "", methodObject ),
|
||||
new Among ( "keit", -1, 4, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32, 8 };
|
||||
|
@ -722,5 +729,15 @@ public class German2Stemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof German2Stemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return German2Stemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,54 +1,61 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class GermanStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", this),
|
||||
new Among ( "U", 0, 2, "", this),
|
||||
new Among ( "Y", 0, 1, "", this),
|
||||
new Among ( "\u00E4", 0, 3, "", this),
|
||||
new Among ( "\u00F6", 0, 4, "", this),
|
||||
new Among ( "\u00FC", 0, 5, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static GermanStemmer methodObject = new GermanStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", methodObject ),
|
||||
new Among ( "U", 0, 2, "", methodObject ),
|
||||
new Among ( "Y", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E4", 0, 3, "", methodObject ),
|
||||
new Among ( "\u00F6", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00FC", 0, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "em", -1, 1, "", this),
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "ern", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "s", -1, 2, "", this),
|
||||
new Among ( "es", 5, 1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "em", -1, 1, "", methodObject ),
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "ern", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "s", -1, 2, "", methodObject ),
|
||||
new Among ( "es", 5, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "st", -1, 2, "", this),
|
||||
new Among ( "est", 2, 1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "st", -1, 2, "", methodObject ),
|
||||
new Among ( "est", 2, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ig", -1, 1, "", this),
|
||||
new Among ( "lich", -1, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ig", -1, 1, "", methodObject ),
|
||||
new Among ( "lich", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "end", -1, 1, "", this),
|
||||
new Among ( "ig", -1, 2, "", this),
|
||||
new Among ( "ung", -1, 1, "", this),
|
||||
new Among ( "lich", -1, 3, "", this),
|
||||
new Among ( "isch", -1, 2, "", this),
|
||||
new Among ( "ik", -1, 2, "", this),
|
||||
new Among ( "heit", -1, 3, "", this),
|
||||
new Among ( "keit", -1, 4, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "end", -1, 1, "", methodObject ),
|
||||
new Among ( "ig", -1, 2, "", methodObject ),
|
||||
new Among ( "ung", -1, 1, "", methodObject ),
|
||||
new Among ( "lich", -1, 3, "", methodObject ),
|
||||
new Among ( "isch", -1, 2, "", methodObject ),
|
||||
new Among ( "ik", -1, 2, "", methodObject ),
|
||||
new Among ( "heit", -1, 3, "", methodObject ),
|
||||
new Among ( "keit", -1, 4, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 8, 0, 32, 8 };
|
||||
|
@ -684,5 +691,15 @@ public class GermanStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof GermanStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return GermanStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,230 +1,237 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class HungarianStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "cs", -1, -1, "", this),
|
||||
new Among ( "dzs", -1, -1, "", this),
|
||||
new Among ( "gy", -1, -1, "", this),
|
||||
new Among ( "ly", -1, -1, "", this),
|
||||
new Among ( "ny", -1, -1, "", this),
|
||||
new Among ( "sz", -1, -1, "", this),
|
||||
new Among ( "ty", -1, -1, "", this),
|
||||
new Among ( "zs", -1, -1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static HungarianStemmer methodObject = new HungarianStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "cs", -1, -1, "", methodObject ),
|
||||
new Among ( "dzs", -1, -1, "", methodObject ),
|
||||
new Among ( "gy", -1, -1, "", methodObject ),
|
||||
new Among ( "ly", -1, -1, "", methodObject ),
|
||||
new Among ( "ny", -1, -1, "", methodObject ),
|
||||
new Among ( "sz", -1, -1, "", methodObject ),
|
||||
new Among ( "ty", -1, -1, "", methodObject ),
|
||||
new Among ( "zs", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "\u00E1", -1, 1, "", this),
|
||||
new Among ( "\u00E9", -1, 2, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "\u00E1", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "bb", -1, -1, "", this),
|
||||
new Among ( "cc", -1, -1, "", this),
|
||||
new Among ( "dd", -1, -1, "", this),
|
||||
new Among ( "ff", -1, -1, "", this),
|
||||
new Among ( "gg", -1, -1, "", this),
|
||||
new Among ( "jj", -1, -1, "", this),
|
||||
new Among ( "kk", -1, -1, "", this),
|
||||
new Among ( "ll", -1, -1, "", this),
|
||||
new Among ( "mm", -1, -1, "", this),
|
||||
new Among ( "nn", -1, -1, "", this),
|
||||
new Among ( "pp", -1, -1, "", this),
|
||||
new Among ( "rr", -1, -1, "", this),
|
||||
new Among ( "ccs", -1, -1, "", this),
|
||||
new Among ( "ss", -1, -1, "", this),
|
||||
new Among ( "zzs", -1, -1, "", this),
|
||||
new Among ( "tt", -1, -1, "", this),
|
||||
new Among ( "vv", -1, -1, "", this),
|
||||
new Among ( "ggy", -1, -1, "", this),
|
||||
new Among ( "lly", -1, -1, "", this),
|
||||
new Among ( "nny", -1, -1, "", this),
|
||||
new Among ( "tty", -1, -1, "", this),
|
||||
new Among ( "ssz", -1, -1, "", this),
|
||||
new Among ( "zz", -1, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "bb", -1, -1, "", methodObject ),
|
||||
new Among ( "cc", -1, -1, "", methodObject ),
|
||||
new Among ( "dd", -1, -1, "", methodObject ),
|
||||
new Among ( "ff", -1, -1, "", methodObject ),
|
||||
new Among ( "gg", -1, -1, "", methodObject ),
|
||||
new Among ( "jj", -1, -1, "", methodObject ),
|
||||
new Among ( "kk", -1, -1, "", methodObject ),
|
||||
new Among ( "ll", -1, -1, "", methodObject ),
|
||||
new Among ( "mm", -1, -1, "", methodObject ),
|
||||
new Among ( "nn", -1, -1, "", methodObject ),
|
||||
new Among ( "pp", -1, -1, "", methodObject ),
|
||||
new Among ( "rr", -1, -1, "", methodObject ),
|
||||
new Among ( "ccs", -1, -1, "", methodObject ),
|
||||
new Among ( "ss", -1, -1, "", methodObject ),
|
||||
new Among ( "zzs", -1, -1, "", methodObject ),
|
||||
new Among ( "tt", -1, -1, "", methodObject ),
|
||||
new Among ( "vv", -1, -1, "", methodObject ),
|
||||
new Among ( "ggy", -1, -1, "", methodObject ),
|
||||
new Among ( "lly", -1, -1, "", methodObject ),
|
||||
new Among ( "nny", -1, -1, "", methodObject ),
|
||||
new Among ( "tty", -1, -1, "", methodObject ),
|
||||
new Among ( "ssz", -1, -1, "", methodObject ),
|
||||
new Among ( "zz", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "al", -1, 1, "", this),
|
||||
new Among ( "el", -1, 2, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "al", -1, 1, "", methodObject ),
|
||||
new Among ( "el", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ba", -1, -1, "", this),
|
||||
new Among ( "ra", -1, -1, "", this),
|
||||
new Among ( "be", -1, -1, "", this),
|
||||
new Among ( "re", -1, -1, "", this),
|
||||
new Among ( "ig", -1, -1, "", this),
|
||||
new Among ( "nak", -1, -1, "", this),
|
||||
new Among ( "nek", -1, -1, "", this),
|
||||
new Among ( "val", -1, -1, "", this),
|
||||
new Among ( "vel", -1, -1, "", this),
|
||||
new Among ( "ul", -1, -1, "", this),
|
||||
new Among ( "n\u00E1l", -1, -1, "", this),
|
||||
new Among ( "n\u00E9l", -1, -1, "", this),
|
||||
new Among ( "b\u00F3l", -1, -1, "", this),
|
||||
new Among ( "r\u00F3l", -1, -1, "", this),
|
||||
new Among ( "t\u00F3l", -1, -1, "", this),
|
||||
new Among ( "b\u00F5l", -1, -1, "", this),
|
||||
new Among ( "r\u00F5l", -1, -1, "", this),
|
||||
new Among ( "t\u00F5l", -1, -1, "", this),
|
||||
new Among ( "\u00FCl", -1, -1, "", this),
|
||||
new Among ( "n", -1, -1, "", this),
|
||||
new Among ( "an", 19, -1, "", this),
|
||||
new Among ( "ban", 20, -1, "", this),
|
||||
new Among ( "en", 19, -1, "", this),
|
||||
new Among ( "ben", 22, -1, "", this),
|
||||
new Among ( "k\u00E9ppen", 22, -1, "", this),
|
||||
new Among ( "on", 19, -1, "", this),
|
||||
new Among ( "\u00F6n", 19, -1, "", this),
|
||||
new Among ( "k\u00E9pp", -1, -1, "", this),
|
||||
new Among ( "kor", -1, -1, "", this),
|
||||
new Among ( "t", -1, -1, "", this),
|
||||
new Among ( "at", 29, -1, "", this),
|
||||
new Among ( "et", 29, -1, "", this),
|
||||
new Among ( "k\u00E9nt", 29, -1, "", this),
|
||||
new Among ( "ank\u00E9nt", 32, -1, "", this),
|
||||
new Among ( "enk\u00E9nt", 32, -1, "", this),
|
||||
new Among ( "onk\u00E9nt", 32, -1, "", this),
|
||||
new Among ( "ot", 29, -1, "", this),
|
||||
new Among ( "\u00E9rt", 29, -1, "", this),
|
||||
new Among ( "\u00F6t", 29, -1, "", this),
|
||||
new Among ( "hez", -1, -1, "", this),
|
||||
new Among ( "hoz", -1, -1, "", this),
|
||||
new Among ( "h\u00F6z", -1, -1, "", this),
|
||||
new Among ( "v\u00E1", -1, -1, "", this),
|
||||
new Among ( "v\u00E9", -1, -1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ba", -1, -1, "", methodObject ),
|
||||
new Among ( "ra", -1, -1, "", methodObject ),
|
||||
new Among ( "be", -1, -1, "", methodObject ),
|
||||
new Among ( "re", -1, -1, "", methodObject ),
|
||||
new Among ( "ig", -1, -1, "", methodObject ),
|
||||
new Among ( "nak", -1, -1, "", methodObject ),
|
||||
new Among ( "nek", -1, -1, "", methodObject ),
|
||||
new Among ( "val", -1, -1, "", methodObject ),
|
||||
new Among ( "vel", -1, -1, "", methodObject ),
|
||||
new Among ( "ul", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u00E1l", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u00E9l", -1, -1, "", methodObject ),
|
||||
new Among ( "b\u00F3l", -1, -1, "", methodObject ),
|
||||
new Among ( "r\u00F3l", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00F3l", -1, -1, "", methodObject ),
|
||||
new Among ( "b\u00F5l", -1, -1, "", methodObject ),
|
||||
new Among ( "r\u00F5l", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00F5l", -1, -1, "", methodObject ),
|
||||
new Among ( "\u00FCl", -1, -1, "", methodObject ),
|
||||
new Among ( "n", -1, -1, "", methodObject ),
|
||||
new Among ( "an", 19, -1, "", methodObject ),
|
||||
new Among ( "ban", 20, -1, "", methodObject ),
|
||||
new Among ( "en", 19, -1, "", methodObject ),
|
||||
new Among ( "ben", 22, -1, "", methodObject ),
|
||||
new Among ( "k\u00E9ppen", 22, -1, "", methodObject ),
|
||||
new Among ( "on", 19, -1, "", methodObject ),
|
||||
new Among ( "\u00F6n", 19, -1, "", methodObject ),
|
||||
new Among ( "k\u00E9pp", -1, -1, "", methodObject ),
|
||||
new Among ( "kor", -1, -1, "", methodObject ),
|
||||
new Among ( "t", -1, -1, "", methodObject ),
|
||||
new Among ( "at", 29, -1, "", methodObject ),
|
||||
new Among ( "et", 29, -1, "", methodObject ),
|
||||
new Among ( "k\u00E9nt", 29, -1, "", methodObject ),
|
||||
new Among ( "ank\u00E9nt", 32, -1, "", methodObject ),
|
||||
new Among ( "enk\u00E9nt", 32, -1, "", methodObject ),
|
||||
new Among ( "onk\u00E9nt", 32, -1, "", methodObject ),
|
||||
new Among ( "ot", 29, -1, "", methodObject ),
|
||||
new Among ( "\u00E9rt", 29, -1, "", methodObject ),
|
||||
new Among ( "\u00F6t", 29, -1, "", methodObject ),
|
||||
new Among ( "hez", -1, -1, "", methodObject ),
|
||||
new Among ( "hoz", -1, -1, "", methodObject ),
|
||||
new Among ( "h\u00F6z", -1, -1, "", methodObject ),
|
||||
new Among ( "v\u00E1", -1, -1, "", methodObject ),
|
||||
new Among ( "v\u00E9", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "\u00E1n", -1, 2, "", this),
|
||||
new Among ( "\u00E9n", -1, 1, "", this),
|
||||
new Among ( "\u00E1nk\u00E9nt", -1, 3, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "\u00E1n", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E9n", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E1nk\u00E9nt", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "stul", -1, 2, "", this),
|
||||
new Among ( "astul", 0, 1, "", this),
|
||||
new Among ( "\u00E1stul", 0, 3, "", this),
|
||||
new Among ( "st\u00FCl", -1, 2, "", this),
|
||||
new Among ( "est\u00FCl", 3, 1, "", this),
|
||||
new Among ( "\u00E9st\u00FCl", 3, 4, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "stul", -1, 2, "", methodObject ),
|
||||
new Among ( "astul", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E1stul", 0, 3, "", methodObject ),
|
||||
new Among ( "st\u00FCl", -1, 2, "", methodObject ),
|
||||
new Among ( "est\u00FCl", 3, 1, "", methodObject ),
|
||||
new Among ( "\u00E9st\u00FCl", 3, 4, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "\u00E1", -1, 1, "", this),
|
||||
new Among ( "\u00E9", -1, 2, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "\u00E1", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "k", -1, 7, "", this),
|
||||
new Among ( "ak", 0, 4, "", this),
|
||||
new Among ( "ek", 0, 6, "", this),
|
||||
new Among ( "ok", 0, 5, "", this),
|
||||
new Among ( "\u00E1k", 0, 1, "", this),
|
||||
new Among ( "\u00E9k", 0, 2, "", this),
|
||||
new Among ( "\u00F6k", 0, 3, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "k", -1, 7, "", methodObject ),
|
||||
new Among ( "ak", 0, 4, "", methodObject ),
|
||||
new Among ( "ek", 0, 6, "", methodObject ),
|
||||
new Among ( "ok", 0, 5, "", methodObject ),
|
||||
new Among ( "\u00E1k", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E9k", 0, 2, "", methodObject ),
|
||||
new Among ( "\u00F6k", 0, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_9[] = {
|
||||
new Among ( "\u00E9i", -1, 7, "", this),
|
||||
new Among ( "\u00E1\u00E9i", 0, 6, "", this),
|
||||
new Among ( "\u00E9\u00E9i", 0, 5, "", this),
|
||||
new Among ( "\u00E9", -1, 9, "", this),
|
||||
new Among ( "k\u00E9", 3, 4, "", this),
|
||||
new Among ( "ak\u00E9", 4, 1, "", this),
|
||||
new Among ( "ek\u00E9", 4, 1, "", this),
|
||||
new Among ( "ok\u00E9", 4, 1, "", this),
|
||||
new Among ( "\u00E1k\u00E9", 4, 3, "", this),
|
||||
new Among ( "\u00E9k\u00E9", 4, 2, "", this),
|
||||
new Among ( "\u00F6k\u00E9", 4, 1, "", this),
|
||||
new Among ( "\u00E9\u00E9", 3, 8, "", this)
|
||||
private final static Among a_9[] = {
|
||||
new Among ( "\u00E9i", -1, 7, "", methodObject ),
|
||||
new Among ( "\u00E1\u00E9i", 0, 6, "", methodObject ),
|
||||
new Among ( "\u00E9\u00E9i", 0, 5, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 9, "", methodObject ),
|
||||
new Among ( "k\u00E9", 3, 4, "", methodObject ),
|
||||
new Among ( "ak\u00E9", 4, 1, "", methodObject ),
|
||||
new Among ( "ek\u00E9", 4, 1, "", methodObject ),
|
||||
new Among ( "ok\u00E9", 4, 1, "", methodObject ),
|
||||
new Among ( "\u00E1k\u00E9", 4, 3, "", methodObject ),
|
||||
new Among ( "\u00E9k\u00E9", 4, 2, "", methodObject ),
|
||||
new Among ( "\u00F6k\u00E9", 4, 1, "", methodObject ),
|
||||
new Among ( "\u00E9\u00E9", 3, 8, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_10[] = {
|
||||
new Among ( "a", -1, 18, "", this),
|
||||
new Among ( "ja", 0, 17, "", this),
|
||||
new Among ( "d", -1, 16, "", this),
|
||||
new Among ( "ad", 2, 13, "", this),
|
||||
new Among ( "ed", 2, 13, "", this),
|
||||
new Among ( "od", 2, 13, "", this),
|
||||
new Among ( "\u00E1d", 2, 14, "", this),
|
||||
new Among ( "\u00E9d", 2, 15, "", this),
|
||||
new Among ( "\u00F6d", 2, 13, "", this),
|
||||
new Among ( "e", -1, 18, "", this),
|
||||
new Among ( "je", 9, 17, "", this),
|
||||
new Among ( "nk", -1, 4, "", this),
|
||||
new Among ( "unk", 11, 1, "", this),
|
||||
new Among ( "\u00E1nk", 11, 2, "", this),
|
||||
new Among ( "\u00E9nk", 11, 3, "", this),
|
||||
new Among ( "\u00FCnk", 11, 1, "", this),
|
||||
new Among ( "uk", -1, 8, "", this),
|
||||
new Among ( "juk", 16, 7, "", this),
|
||||
new Among ( "\u00E1juk", 17, 5, "", this),
|
||||
new Among ( "\u00FCk", -1, 8, "", this),
|
||||
new Among ( "j\u00FCk", 19, 7, "", this),
|
||||
new Among ( "\u00E9j\u00FCk", 20, 6, "", this),
|
||||
new Among ( "m", -1, 12, "", this),
|
||||
new Among ( "am", 22, 9, "", this),
|
||||
new Among ( "em", 22, 9, "", this),
|
||||
new Among ( "om", 22, 9, "", this),
|
||||
new Among ( "\u00E1m", 22, 10, "", this),
|
||||
new Among ( "\u00E9m", 22, 11, "", this),
|
||||
new Among ( "o", -1, 18, "", this),
|
||||
new Among ( "\u00E1", -1, 19, "", this),
|
||||
new Among ( "\u00E9", -1, 20, "", this)
|
||||
private final static Among a_10[] = {
|
||||
new Among ( "a", -1, 18, "", methodObject ),
|
||||
new Among ( "ja", 0, 17, "", methodObject ),
|
||||
new Among ( "d", -1, 16, "", methodObject ),
|
||||
new Among ( "ad", 2, 13, "", methodObject ),
|
||||
new Among ( "ed", 2, 13, "", methodObject ),
|
||||
new Among ( "od", 2, 13, "", methodObject ),
|
||||
new Among ( "\u00E1d", 2, 14, "", methodObject ),
|
||||
new Among ( "\u00E9d", 2, 15, "", methodObject ),
|
||||
new Among ( "\u00F6d", 2, 13, "", methodObject ),
|
||||
new Among ( "e", -1, 18, "", methodObject ),
|
||||
new Among ( "je", 9, 17, "", methodObject ),
|
||||
new Among ( "nk", -1, 4, "", methodObject ),
|
||||
new Among ( "unk", 11, 1, "", methodObject ),
|
||||
new Among ( "\u00E1nk", 11, 2, "", methodObject ),
|
||||
new Among ( "\u00E9nk", 11, 3, "", methodObject ),
|
||||
new Among ( "\u00FCnk", 11, 1, "", methodObject ),
|
||||
new Among ( "uk", -1, 8, "", methodObject ),
|
||||
new Among ( "juk", 16, 7, "", methodObject ),
|
||||
new Among ( "\u00E1juk", 17, 5, "", methodObject ),
|
||||
new Among ( "\u00FCk", -1, 8, "", methodObject ),
|
||||
new Among ( "j\u00FCk", 19, 7, "", methodObject ),
|
||||
new Among ( "\u00E9j\u00FCk", 20, 6, "", methodObject ),
|
||||
new Among ( "m", -1, 12, "", methodObject ),
|
||||
new Among ( "am", 22, 9, "", methodObject ),
|
||||
new Among ( "em", 22, 9, "", methodObject ),
|
||||
new Among ( "om", 22, 9, "", methodObject ),
|
||||
new Among ( "\u00E1m", 22, 10, "", methodObject ),
|
||||
new Among ( "\u00E9m", 22, 11, "", methodObject ),
|
||||
new Among ( "o", -1, 18, "", methodObject ),
|
||||
new Among ( "\u00E1", -1, 19, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 20, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_11[] = {
|
||||
new Among ( "id", -1, 10, "", this),
|
||||
new Among ( "aid", 0, 9, "", this),
|
||||
new Among ( "jaid", 1, 6, "", this),
|
||||
new Among ( "eid", 0, 9, "", this),
|
||||
new Among ( "jeid", 3, 6, "", this),
|
||||
new Among ( "\u00E1id", 0, 7, "", this),
|
||||
new Among ( "\u00E9id", 0, 8, "", this),
|
||||
new Among ( "i", -1, 15, "", this),
|
||||
new Among ( "ai", 7, 14, "", this),
|
||||
new Among ( "jai", 8, 11, "", this),
|
||||
new Among ( "ei", 7, 14, "", this),
|
||||
new Among ( "jei", 10, 11, "", this),
|
||||
new Among ( "\u00E1i", 7, 12, "", this),
|
||||
new Among ( "\u00E9i", 7, 13, "", this),
|
||||
new Among ( "itek", -1, 24, "", this),
|
||||
new Among ( "eitek", 14, 21, "", this),
|
||||
new Among ( "jeitek", 15, 20, "", this),
|
||||
new Among ( "\u00E9itek", 14, 23, "", this),
|
||||
new Among ( "ik", -1, 29, "", this),
|
||||
new Among ( "aik", 18, 26, "", this),
|
||||
new Among ( "jaik", 19, 25, "", this),
|
||||
new Among ( "eik", 18, 26, "", this),
|
||||
new Among ( "jeik", 21, 25, "", this),
|
||||
new Among ( "\u00E1ik", 18, 27, "", this),
|
||||
new Among ( "\u00E9ik", 18, 28, "", this),
|
||||
new Among ( "ink", -1, 20, "", this),
|
||||
new Among ( "aink", 25, 17, "", this),
|
||||
new Among ( "jaink", 26, 16, "", this),
|
||||
new Among ( "eink", 25, 17, "", this),
|
||||
new Among ( "jeink", 28, 16, "", this),
|
||||
new Among ( "\u00E1ink", 25, 18, "", this),
|
||||
new Among ( "\u00E9ink", 25, 19, "", this),
|
||||
new Among ( "aitok", -1, 21, "", this),
|
||||
new Among ( "jaitok", 32, 20, "", this),
|
||||
new Among ( "\u00E1itok", -1, 22, "", this),
|
||||
new Among ( "im", -1, 5, "", this),
|
||||
new Among ( "aim", 35, 4, "", this),
|
||||
new Among ( "jaim", 36, 1, "", this),
|
||||
new Among ( "eim", 35, 4, "", this),
|
||||
new Among ( "jeim", 38, 1, "", this),
|
||||
new Among ( "\u00E1im", 35, 2, "", this),
|
||||
new Among ( "\u00E9im", 35, 3, "", this)
|
||||
private final static Among a_11[] = {
|
||||
new Among ( "id", -1, 10, "", methodObject ),
|
||||
new Among ( "aid", 0, 9, "", methodObject ),
|
||||
new Among ( "jaid", 1, 6, "", methodObject ),
|
||||
new Among ( "eid", 0, 9, "", methodObject ),
|
||||
new Among ( "jeid", 3, 6, "", methodObject ),
|
||||
new Among ( "\u00E1id", 0, 7, "", methodObject ),
|
||||
new Among ( "\u00E9id", 0, 8, "", methodObject ),
|
||||
new Among ( "i", -1, 15, "", methodObject ),
|
||||
new Among ( "ai", 7, 14, "", methodObject ),
|
||||
new Among ( "jai", 8, 11, "", methodObject ),
|
||||
new Among ( "ei", 7, 14, "", methodObject ),
|
||||
new Among ( "jei", 10, 11, "", methodObject ),
|
||||
new Among ( "\u00E1i", 7, 12, "", methodObject ),
|
||||
new Among ( "\u00E9i", 7, 13, "", methodObject ),
|
||||
new Among ( "itek", -1, 24, "", methodObject ),
|
||||
new Among ( "eitek", 14, 21, "", methodObject ),
|
||||
new Among ( "jeitek", 15, 20, "", methodObject ),
|
||||
new Among ( "\u00E9itek", 14, 23, "", methodObject ),
|
||||
new Among ( "ik", -1, 29, "", methodObject ),
|
||||
new Among ( "aik", 18, 26, "", methodObject ),
|
||||
new Among ( "jaik", 19, 25, "", methodObject ),
|
||||
new Among ( "eik", 18, 26, "", methodObject ),
|
||||
new Among ( "jeik", 21, 25, "", methodObject ),
|
||||
new Among ( "\u00E1ik", 18, 27, "", methodObject ),
|
||||
new Among ( "\u00E9ik", 18, 28, "", methodObject ),
|
||||
new Among ( "ink", -1, 20, "", methodObject ),
|
||||
new Among ( "aink", 25, 17, "", methodObject ),
|
||||
new Among ( "jaink", 26, 16, "", methodObject ),
|
||||
new Among ( "eink", 25, 17, "", methodObject ),
|
||||
new Among ( "jeink", 28, 16, "", methodObject ),
|
||||
new Among ( "\u00E1ink", 25, 18, "", methodObject ),
|
||||
new Among ( "\u00E9ink", 25, 19, "", methodObject ),
|
||||
new Among ( "aitok", -1, 21, "", methodObject ),
|
||||
new Among ( "jaitok", 32, 20, "", methodObject ),
|
||||
new Among ( "\u00E1itok", -1, 22, "", methodObject ),
|
||||
new Among ( "im", -1, 5, "", methodObject ),
|
||||
new Among ( "aim", 35, 4, "", methodObject ),
|
||||
new Among ( "jaim", 36, 1, "", methodObject ),
|
||||
new Among ( "eim", 35, 4, "", methodObject ),
|
||||
new Among ( "jeim", 38, 1, "", methodObject ),
|
||||
new Among ( "\u00E1im", 35, 2, "", methodObject ),
|
||||
new Among ( "\u00E9im", 35, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 17, 52, 14 };
|
||||
|
@ -1154,5 +1161,15 @@ public class HungarianStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof HungarianStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return HungarianStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,233 +1,240 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class ItalianStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 7, "", this),
|
||||
new Among ( "qu", 0, 6, "", this),
|
||||
new Among ( "\u00E1", 0, 1, "", this),
|
||||
new Among ( "\u00E9", 0, 2, "", this),
|
||||
new Among ( "\u00ED", 0, 3, "", this),
|
||||
new Among ( "\u00F3", 0, 4, "", this),
|
||||
new Among ( "\u00FA", 0, 5, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static ItalianStemmer methodObject = new ItalianStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 7, "", methodObject ),
|
||||
new Among ( "qu", 0, 6, "", methodObject ),
|
||||
new Among ( "\u00E1", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E9", 0, 2, "", methodObject ),
|
||||
new Among ( "\u00ED", 0, 3, "", methodObject ),
|
||||
new Among ( "\u00F3", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00FA", 0, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "I", 0, 1, "", this),
|
||||
new Among ( "U", 0, 2, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "I", 0, 1, "", methodObject ),
|
||||
new Among ( "U", 0, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "la", -1, -1, "", this),
|
||||
new Among ( "cela", 0, -1, "", this),
|
||||
new Among ( "gliela", 0, -1, "", this),
|
||||
new Among ( "mela", 0, -1, "", this),
|
||||
new Among ( "tela", 0, -1, "", this),
|
||||
new Among ( "vela", 0, -1, "", this),
|
||||
new Among ( "le", -1, -1, "", this),
|
||||
new Among ( "cele", 6, -1, "", this),
|
||||
new Among ( "gliele", 6, -1, "", this),
|
||||
new Among ( "mele", 6, -1, "", this),
|
||||
new Among ( "tele", 6, -1, "", this),
|
||||
new Among ( "vele", 6, -1, "", this),
|
||||
new Among ( "ne", -1, -1, "", this),
|
||||
new Among ( "cene", 12, -1, "", this),
|
||||
new Among ( "gliene", 12, -1, "", this),
|
||||
new Among ( "mene", 12, -1, "", this),
|
||||
new Among ( "sene", 12, -1, "", this),
|
||||
new Among ( "tene", 12, -1, "", this),
|
||||
new Among ( "vene", 12, -1, "", this),
|
||||
new Among ( "ci", -1, -1, "", this),
|
||||
new Among ( "li", -1, -1, "", this),
|
||||
new Among ( "celi", 20, -1, "", this),
|
||||
new Among ( "glieli", 20, -1, "", this),
|
||||
new Among ( "meli", 20, -1, "", this),
|
||||
new Among ( "teli", 20, -1, "", this),
|
||||
new Among ( "veli", 20, -1, "", this),
|
||||
new Among ( "gli", 20, -1, "", this),
|
||||
new Among ( "mi", -1, -1, "", this),
|
||||
new Among ( "si", -1, -1, "", this),
|
||||
new Among ( "ti", -1, -1, "", this),
|
||||
new Among ( "vi", -1, -1, "", this),
|
||||
new Among ( "lo", -1, -1, "", this),
|
||||
new Among ( "celo", 31, -1, "", this),
|
||||
new Among ( "glielo", 31, -1, "", this),
|
||||
new Among ( "melo", 31, -1, "", this),
|
||||
new Among ( "telo", 31, -1, "", this),
|
||||
new Among ( "velo", 31, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "la", -1, -1, "", methodObject ),
|
||||
new Among ( "cela", 0, -1, "", methodObject ),
|
||||
new Among ( "gliela", 0, -1, "", methodObject ),
|
||||
new Among ( "mela", 0, -1, "", methodObject ),
|
||||
new Among ( "tela", 0, -1, "", methodObject ),
|
||||
new Among ( "vela", 0, -1, "", methodObject ),
|
||||
new Among ( "le", -1, -1, "", methodObject ),
|
||||
new Among ( "cele", 6, -1, "", methodObject ),
|
||||
new Among ( "gliele", 6, -1, "", methodObject ),
|
||||
new Among ( "mele", 6, -1, "", methodObject ),
|
||||
new Among ( "tele", 6, -1, "", methodObject ),
|
||||
new Among ( "vele", 6, -1, "", methodObject ),
|
||||
new Among ( "ne", -1, -1, "", methodObject ),
|
||||
new Among ( "cene", 12, -1, "", methodObject ),
|
||||
new Among ( "gliene", 12, -1, "", methodObject ),
|
||||
new Among ( "mene", 12, -1, "", methodObject ),
|
||||
new Among ( "sene", 12, -1, "", methodObject ),
|
||||
new Among ( "tene", 12, -1, "", methodObject ),
|
||||
new Among ( "vene", 12, -1, "", methodObject ),
|
||||
new Among ( "ci", -1, -1, "", methodObject ),
|
||||
new Among ( "li", -1, -1, "", methodObject ),
|
||||
new Among ( "celi", 20, -1, "", methodObject ),
|
||||
new Among ( "glieli", 20, -1, "", methodObject ),
|
||||
new Among ( "meli", 20, -1, "", methodObject ),
|
||||
new Among ( "teli", 20, -1, "", methodObject ),
|
||||
new Among ( "veli", 20, -1, "", methodObject ),
|
||||
new Among ( "gli", 20, -1, "", methodObject ),
|
||||
new Among ( "mi", -1, -1, "", methodObject ),
|
||||
new Among ( "si", -1, -1, "", methodObject ),
|
||||
new Among ( "ti", -1, -1, "", methodObject ),
|
||||
new Among ( "vi", -1, -1, "", methodObject ),
|
||||
new Among ( "lo", -1, -1, "", methodObject ),
|
||||
new Among ( "celo", 31, -1, "", methodObject ),
|
||||
new Among ( "glielo", 31, -1, "", methodObject ),
|
||||
new Among ( "melo", 31, -1, "", methodObject ),
|
||||
new Among ( "telo", 31, -1, "", methodObject ),
|
||||
new Among ( "velo", 31, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ando", -1, 1, "", this),
|
||||
new Among ( "endo", -1, 1, "", this),
|
||||
new Among ( "ar", -1, 2, "", this),
|
||||
new Among ( "er", -1, 2, "", this),
|
||||
new Among ( "ir", -1, 2, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ando", -1, 1, "", methodObject ),
|
||||
new Among ( "endo", -1, 1, "", methodObject ),
|
||||
new Among ( "ar", -1, 2, "", methodObject ),
|
||||
new Among ( "er", -1, 2, "", methodObject ),
|
||||
new Among ( "ir", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ic", -1, -1, "", this),
|
||||
new Among ( "abil", -1, -1, "", this),
|
||||
new Among ( "os", -1, -1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ic", -1, -1, "", methodObject ),
|
||||
new Among ( "abil", -1, -1, "", methodObject ),
|
||||
new Among ( "os", -1, -1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "ic", -1, 1, "", this),
|
||||
new Among ( "abil", -1, 1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "ic", -1, 1, "", methodObject ),
|
||||
new Among ( "abil", -1, 1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "ica", -1, 1, "", this),
|
||||
new Among ( "logia", -1, 3, "", this),
|
||||
new Among ( "osa", -1, 1, "", this),
|
||||
new Among ( "ista", -1, 1, "", this),
|
||||
new Among ( "iva", -1, 9, "", this),
|
||||
new Among ( "anza", -1, 1, "", this),
|
||||
new Among ( "enza", -1, 5, "", this),
|
||||
new Among ( "ice", -1, 1, "", this),
|
||||
new Among ( "atrice", 7, 1, "", this),
|
||||
new Among ( "iche", -1, 1, "", this),
|
||||
new Among ( "logie", -1, 3, "", this),
|
||||
new Among ( "abile", -1, 1, "", this),
|
||||
new Among ( "ibile", -1, 1, "", this),
|
||||
new Among ( "usione", -1, 4, "", this),
|
||||
new Among ( "azione", -1, 2, "", this),
|
||||
new Among ( "uzione", -1, 4, "", this),
|
||||
new Among ( "atore", -1, 2, "", this),
|
||||
new Among ( "ose", -1, 1, "", this),
|
||||
new Among ( "ante", -1, 1, "", this),
|
||||
new Among ( "mente", -1, 1, "", this),
|
||||
new Among ( "amente", 19, 7, "", this),
|
||||
new Among ( "iste", -1, 1, "", this),
|
||||
new Among ( "ive", -1, 9, "", this),
|
||||
new Among ( "anze", -1, 1, "", this),
|
||||
new Among ( "enze", -1, 5, "", this),
|
||||
new Among ( "ici", -1, 1, "", this),
|
||||
new Among ( "atrici", 25, 1, "", this),
|
||||
new Among ( "ichi", -1, 1, "", this),
|
||||
new Among ( "abili", -1, 1, "", this),
|
||||
new Among ( "ibili", -1, 1, "", this),
|
||||
new Among ( "ismi", -1, 1, "", this),
|
||||
new Among ( "usioni", -1, 4, "", this),
|
||||
new Among ( "azioni", -1, 2, "", this),
|
||||
new Among ( "uzioni", -1, 4, "", this),
|
||||
new Among ( "atori", -1, 2, "", this),
|
||||
new Among ( "osi", -1, 1, "", this),
|
||||
new Among ( "anti", -1, 1, "", this),
|
||||
new Among ( "amenti", -1, 6, "", this),
|
||||
new Among ( "imenti", -1, 6, "", this),
|
||||
new Among ( "isti", -1, 1, "", this),
|
||||
new Among ( "ivi", -1, 9, "", this),
|
||||
new Among ( "ico", -1, 1, "", this),
|
||||
new Among ( "ismo", -1, 1, "", this),
|
||||
new Among ( "oso", -1, 1, "", this),
|
||||
new Among ( "amento", -1, 6, "", this),
|
||||
new Among ( "imento", -1, 6, "", this),
|
||||
new Among ( "ivo", -1, 9, "", this),
|
||||
new Among ( "it\u00E0", -1, 8, "", this),
|
||||
new Among ( "ist\u00E0", -1, 1, "", this),
|
||||
new Among ( "ist\u00E8", -1, 1, "", this),
|
||||
new Among ( "ist\u00EC", -1, 1, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "ica", -1, 1, "", methodObject ),
|
||||
new Among ( "logia", -1, 3, "", methodObject ),
|
||||
new Among ( "osa", -1, 1, "", methodObject ),
|
||||
new Among ( "ista", -1, 1, "", methodObject ),
|
||||
new Among ( "iva", -1, 9, "", methodObject ),
|
||||
new Among ( "anza", -1, 1, "", methodObject ),
|
||||
new Among ( "enza", -1, 5, "", methodObject ),
|
||||
new Among ( "ice", -1, 1, "", methodObject ),
|
||||
new Among ( "atrice", 7, 1, "", methodObject ),
|
||||
new Among ( "iche", -1, 1, "", methodObject ),
|
||||
new Among ( "logie", -1, 3, "", methodObject ),
|
||||
new Among ( "abile", -1, 1, "", methodObject ),
|
||||
new Among ( "ibile", -1, 1, "", methodObject ),
|
||||
new Among ( "usione", -1, 4, "", methodObject ),
|
||||
new Among ( "azione", -1, 2, "", methodObject ),
|
||||
new Among ( "uzione", -1, 4, "", methodObject ),
|
||||
new Among ( "atore", -1, 2, "", methodObject ),
|
||||
new Among ( "ose", -1, 1, "", methodObject ),
|
||||
new Among ( "ante", -1, 1, "", methodObject ),
|
||||
new Among ( "mente", -1, 1, "", methodObject ),
|
||||
new Among ( "amente", 19, 7, "", methodObject ),
|
||||
new Among ( "iste", -1, 1, "", methodObject ),
|
||||
new Among ( "ive", -1, 9, "", methodObject ),
|
||||
new Among ( "anze", -1, 1, "", methodObject ),
|
||||
new Among ( "enze", -1, 5, "", methodObject ),
|
||||
new Among ( "ici", -1, 1, "", methodObject ),
|
||||
new Among ( "atrici", 25, 1, "", methodObject ),
|
||||
new Among ( "ichi", -1, 1, "", methodObject ),
|
||||
new Among ( "abili", -1, 1, "", methodObject ),
|
||||
new Among ( "ibili", -1, 1, "", methodObject ),
|
||||
new Among ( "ismi", -1, 1, "", methodObject ),
|
||||
new Among ( "usioni", -1, 4, "", methodObject ),
|
||||
new Among ( "azioni", -1, 2, "", methodObject ),
|
||||
new Among ( "uzioni", -1, 4, "", methodObject ),
|
||||
new Among ( "atori", -1, 2, "", methodObject ),
|
||||
new Among ( "osi", -1, 1, "", methodObject ),
|
||||
new Among ( "anti", -1, 1, "", methodObject ),
|
||||
new Among ( "amenti", -1, 6, "", methodObject ),
|
||||
new Among ( "imenti", -1, 6, "", methodObject ),
|
||||
new Among ( "isti", -1, 1, "", methodObject ),
|
||||
new Among ( "ivi", -1, 9, "", methodObject ),
|
||||
new Among ( "ico", -1, 1, "", methodObject ),
|
||||
new Among ( "ismo", -1, 1, "", methodObject ),
|
||||
new Among ( "oso", -1, 1, "", methodObject ),
|
||||
new Among ( "amento", -1, 6, "", methodObject ),
|
||||
new Among ( "imento", -1, 6, "", methodObject ),
|
||||
new Among ( "ivo", -1, 9, "", methodObject ),
|
||||
new Among ( "it\u00E0", -1, 8, "", methodObject ),
|
||||
new Among ( "ist\u00E0", -1, 1, "", methodObject ),
|
||||
new Among ( "ist\u00E8", -1, 1, "", methodObject ),
|
||||
new Among ( "ist\u00EC", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "isca", -1, 1, "", this),
|
||||
new Among ( "enda", -1, 1, "", this),
|
||||
new Among ( "ata", -1, 1, "", this),
|
||||
new Among ( "ita", -1, 1, "", this),
|
||||
new Among ( "uta", -1, 1, "", this),
|
||||
new Among ( "ava", -1, 1, "", this),
|
||||
new Among ( "eva", -1, 1, "", this),
|
||||
new Among ( "iva", -1, 1, "", this),
|
||||
new Among ( "erebbe", -1, 1, "", this),
|
||||
new Among ( "irebbe", -1, 1, "", this),
|
||||
new Among ( "isce", -1, 1, "", this),
|
||||
new Among ( "ende", -1, 1, "", this),
|
||||
new Among ( "are", -1, 1, "", this),
|
||||
new Among ( "ere", -1, 1, "", this),
|
||||
new Among ( "ire", -1, 1, "", this),
|
||||
new Among ( "asse", -1, 1, "", this),
|
||||
new Among ( "ate", -1, 1, "", this),
|
||||
new Among ( "avate", 16, 1, "", this),
|
||||
new Among ( "evate", 16, 1, "", this),
|
||||
new Among ( "ivate", 16, 1, "", this),
|
||||
new Among ( "ete", -1, 1, "", this),
|
||||
new Among ( "erete", 20, 1, "", this),
|
||||
new Among ( "irete", 20, 1, "", this),
|
||||
new Among ( "ite", -1, 1, "", this),
|
||||
new Among ( "ereste", -1, 1, "", this),
|
||||
new Among ( "ireste", -1, 1, "", this),
|
||||
new Among ( "ute", -1, 1, "", this),
|
||||
new Among ( "erai", -1, 1, "", this),
|
||||
new Among ( "irai", -1, 1, "", this),
|
||||
new Among ( "isci", -1, 1, "", this),
|
||||
new Among ( "endi", -1, 1, "", this),
|
||||
new Among ( "erei", -1, 1, "", this),
|
||||
new Among ( "irei", -1, 1, "", this),
|
||||
new Among ( "assi", -1, 1, "", this),
|
||||
new Among ( "ati", -1, 1, "", this),
|
||||
new Among ( "iti", -1, 1, "", this),
|
||||
new Among ( "eresti", -1, 1, "", this),
|
||||
new Among ( "iresti", -1, 1, "", this),
|
||||
new Among ( "uti", -1, 1, "", this),
|
||||
new Among ( "avi", -1, 1, "", this),
|
||||
new Among ( "evi", -1, 1, "", this),
|
||||
new Among ( "ivi", -1, 1, "", this),
|
||||
new Among ( "isco", -1, 1, "", this),
|
||||
new Among ( "ando", -1, 1, "", this),
|
||||
new Among ( "endo", -1, 1, "", this),
|
||||
new Among ( "Yamo", -1, 1, "", this),
|
||||
new Among ( "iamo", -1, 1, "", this),
|
||||
new Among ( "avamo", -1, 1, "", this),
|
||||
new Among ( "evamo", -1, 1, "", this),
|
||||
new Among ( "ivamo", -1, 1, "", this),
|
||||
new Among ( "eremo", -1, 1, "", this),
|
||||
new Among ( "iremo", -1, 1, "", this),
|
||||
new Among ( "assimo", -1, 1, "", this),
|
||||
new Among ( "ammo", -1, 1, "", this),
|
||||
new Among ( "emmo", -1, 1, "", this),
|
||||
new Among ( "eremmo", 54, 1, "", this),
|
||||
new Among ( "iremmo", 54, 1, "", this),
|
||||
new Among ( "immo", -1, 1, "", this),
|
||||
new Among ( "ano", -1, 1, "", this),
|
||||
new Among ( "iscano", 58, 1, "", this),
|
||||
new Among ( "avano", 58, 1, "", this),
|
||||
new Among ( "evano", 58, 1, "", this),
|
||||
new Among ( "ivano", 58, 1, "", this),
|
||||
new Among ( "eranno", -1, 1, "", this),
|
||||
new Among ( "iranno", -1, 1, "", this),
|
||||
new Among ( "ono", -1, 1, "", this),
|
||||
new Among ( "iscono", 65, 1, "", this),
|
||||
new Among ( "arono", 65, 1, "", this),
|
||||
new Among ( "erono", 65, 1, "", this),
|
||||
new Among ( "irono", 65, 1, "", this),
|
||||
new Among ( "erebbero", -1, 1, "", this),
|
||||
new Among ( "irebbero", -1, 1, "", this),
|
||||
new Among ( "assero", -1, 1, "", this),
|
||||
new Among ( "essero", -1, 1, "", this),
|
||||
new Among ( "issero", -1, 1, "", this),
|
||||
new Among ( "ato", -1, 1, "", this),
|
||||
new Among ( "ito", -1, 1, "", this),
|
||||
new Among ( "uto", -1, 1, "", this),
|
||||
new Among ( "avo", -1, 1, "", this),
|
||||
new Among ( "evo", -1, 1, "", this),
|
||||
new Among ( "ivo", -1, 1, "", this),
|
||||
new Among ( "ar", -1, 1, "", this),
|
||||
new Among ( "ir", -1, 1, "", this),
|
||||
new Among ( "er\u00E0", -1, 1, "", this),
|
||||
new Among ( "ir\u00E0", -1, 1, "", this),
|
||||
new Among ( "er\u00F2", -1, 1, "", this),
|
||||
new Among ( "ir\u00F2", -1, 1, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "isca", -1, 1, "", methodObject ),
|
||||
new Among ( "enda", -1, 1, "", methodObject ),
|
||||
new Among ( "ata", -1, 1, "", methodObject ),
|
||||
new Among ( "ita", -1, 1, "", methodObject ),
|
||||
new Among ( "uta", -1, 1, "", methodObject ),
|
||||
new Among ( "ava", -1, 1, "", methodObject ),
|
||||
new Among ( "eva", -1, 1, "", methodObject ),
|
||||
new Among ( "iva", -1, 1, "", methodObject ),
|
||||
new Among ( "erebbe", -1, 1, "", methodObject ),
|
||||
new Among ( "irebbe", -1, 1, "", methodObject ),
|
||||
new Among ( "isce", -1, 1, "", methodObject ),
|
||||
new Among ( "ende", -1, 1, "", methodObject ),
|
||||
new Among ( "are", -1, 1, "", methodObject ),
|
||||
new Among ( "ere", -1, 1, "", methodObject ),
|
||||
new Among ( "ire", -1, 1, "", methodObject ),
|
||||
new Among ( "asse", -1, 1, "", methodObject ),
|
||||
new Among ( "ate", -1, 1, "", methodObject ),
|
||||
new Among ( "avate", 16, 1, "", methodObject ),
|
||||
new Among ( "evate", 16, 1, "", methodObject ),
|
||||
new Among ( "ivate", 16, 1, "", methodObject ),
|
||||
new Among ( "ete", -1, 1, "", methodObject ),
|
||||
new Among ( "erete", 20, 1, "", methodObject ),
|
||||
new Among ( "irete", 20, 1, "", methodObject ),
|
||||
new Among ( "ite", -1, 1, "", methodObject ),
|
||||
new Among ( "ereste", -1, 1, "", methodObject ),
|
||||
new Among ( "ireste", -1, 1, "", methodObject ),
|
||||
new Among ( "ute", -1, 1, "", methodObject ),
|
||||
new Among ( "erai", -1, 1, "", methodObject ),
|
||||
new Among ( "irai", -1, 1, "", methodObject ),
|
||||
new Among ( "isci", -1, 1, "", methodObject ),
|
||||
new Among ( "endi", -1, 1, "", methodObject ),
|
||||
new Among ( "erei", -1, 1, "", methodObject ),
|
||||
new Among ( "irei", -1, 1, "", methodObject ),
|
||||
new Among ( "assi", -1, 1, "", methodObject ),
|
||||
new Among ( "ati", -1, 1, "", methodObject ),
|
||||
new Among ( "iti", -1, 1, "", methodObject ),
|
||||
new Among ( "eresti", -1, 1, "", methodObject ),
|
||||
new Among ( "iresti", -1, 1, "", methodObject ),
|
||||
new Among ( "uti", -1, 1, "", methodObject ),
|
||||
new Among ( "avi", -1, 1, "", methodObject ),
|
||||
new Among ( "evi", -1, 1, "", methodObject ),
|
||||
new Among ( "ivi", -1, 1, "", methodObject ),
|
||||
new Among ( "isco", -1, 1, "", methodObject ),
|
||||
new Among ( "ando", -1, 1, "", methodObject ),
|
||||
new Among ( "endo", -1, 1, "", methodObject ),
|
||||
new Among ( "Yamo", -1, 1, "", methodObject ),
|
||||
new Among ( "iamo", -1, 1, "", methodObject ),
|
||||
new Among ( "avamo", -1, 1, "", methodObject ),
|
||||
new Among ( "evamo", -1, 1, "", methodObject ),
|
||||
new Among ( "ivamo", -1, 1, "", methodObject ),
|
||||
new Among ( "eremo", -1, 1, "", methodObject ),
|
||||
new Among ( "iremo", -1, 1, "", methodObject ),
|
||||
new Among ( "assimo", -1, 1, "", methodObject ),
|
||||
new Among ( "ammo", -1, 1, "", methodObject ),
|
||||
new Among ( "emmo", -1, 1, "", methodObject ),
|
||||
new Among ( "eremmo", 54, 1, "", methodObject ),
|
||||
new Among ( "iremmo", 54, 1, "", methodObject ),
|
||||
new Among ( "immo", -1, 1, "", methodObject ),
|
||||
new Among ( "ano", -1, 1, "", methodObject ),
|
||||
new Among ( "iscano", 58, 1, "", methodObject ),
|
||||
new Among ( "avano", 58, 1, "", methodObject ),
|
||||
new Among ( "evano", 58, 1, "", methodObject ),
|
||||
new Among ( "ivano", 58, 1, "", methodObject ),
|
||||
new Among ( "eranno", -1, 1, "", methodObject ),
|
||||
new Among ( "iranno", -1, 1, "", methodObject ),
|
||||
new Among ( "ono", -1, 1, "", methodObject ),
|
||||
new Among ( "iscono", 65, 1, "", methodObject ),
|
||||
new Among ( "arono", 65, 1, "", methodObject ),
|
||||
new Among ( "erono", 65, 1, "", methodObject ),
|
||||
new Among ( "irono", 65, 1, "", methodObject ),
|
||||
new Among ( "erebbero", -1, 1, "", methodObject ),
|
||||
new Among ( "irebbero", -1, 1, "", methodObject ),
|
||||
new Among ( "assero", -1, 1, "", methodObject ),
|
||||
new Among ( "essero", -1, 1, "", methodObject ),
|
||||
new Among ( "issero", -1, 1, "", methodObject ),
|
||||
new Among ( "ato", -1, 1, "", methodObject ),
|
||||
new Among ( "ito", -1, 1, "", methodObject ),
|
||||
new Among ( "uto", -1, 1, "", methodObject ),
|
||||
new Among ( "avo", -1, 1, "", methodObject ),
|
||||
new Among ( "evo", -1, 1, "", methodObject ),
|
||||
new Among ( "ivo", -1, 1, "", methodObject ),
|
||||
new Among ( "ar", -1, 1, "", methodObject ),
|
||||
new Among ( "ir", -1, 1, "", methodObject ),
|
||||
new Among ( "er\u00E0", -1, 1, "", methodObject ),
|
||||
new Among ( "ir\u00E0", -1, 1, "", methodObject ),
|
||||
new Among ( "er\u00F2", -1, 1, "", methodObject ),
|
||||
new Among ( "ir\u00F2", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 128, 128, 8, 2, 1 };
|
||||
|
@ -1176,5 +1183,15 @@ public class ItalianStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof ItalianStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return ItalianStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,114 +1,121 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class KpStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "nde", -1, 7, "", this),
|
||||
new Among ( "en", -1, 6, "", this),
|
||||
new Among ( "s", -1, 2, "", this),
|
||||
new Among ( "'s", 2, 1, "", this),
|
||||
new Among ( "es", 2, 4, "", this),
|
||||
new Among ( "ies", 4, 3, "", this),
|
||||
new Among ( "aus", 2, 5, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static KpStemmer methodObject = new KpStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "nde", -1, 7, "", methodObject ),
|
||||
new Among ( "en", -1, 6, "", methodObject ),
|
||||
new Among ( "s", -1, 2, "", methodObject ),
|
||||
new Among ( "'s", 2, 1, "", methodObject ),
|
||||
new Among ( "es", 2, 4, "", methodObject ),
|
||||
new Among ( "ies", 4, 3, "", methodObject ),
|
||||
new Among ( "aus", 2, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "de", -1, 5, "", this),
|
||||
new Among ( "ge", -1, 2, "", this),
|
||||
new Among ( "ische", -1, 4, "", this),
|
||||
new Among ( "je", -1, 1, "", this),
|
||||
new Among ( "lijke", -1, 3, "", this),
|
||||
new Among ( "le", -1, 9, "", this),
|
||||
new Among ( "ene", -1, 10, "", this),
|
||||
new Among ( "re", -1, 8, "", this),
|
||||
new Among ( "se", -1, 7, "", this),
|
||||
new Among ( "te", -1, 6, "", this),
|
||||
new Among ( "ieve", -1, 11, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "de", -1, 5, "", methodObject ),
|
||||
new Among ( "ge", -1, 2, "", methodObject ),
|
||||
new Among ( "ische", -1, 4, "", methodObject ),
|
||||
new Among ( "je", -1, 1, "", methodObject ),
|
||||
new Among ( "lijke", -1, 3, "", methodObject ),
|
||||
new Among ( "le", -1, 9, "", methodObject ),
|
||||
new Among ( "ene", -1, 10, "", methodObject ),
|
||||
new Among ( "re", -1, 8, "", methodObject ),
|
||||
new Among ( "se", -1, 7, "", methodObject ),
|
||||
new Among ( "te", -1, 6, "", methodObject ),
|
||||
new Among ( "ieve", -1, 11, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "heid", -1, 3, "", this),
|
||||
new Among ( "fie", -1, 7, "", this),
|
||||
new Among ( "gie", -1, 8, "", this),
|
||||
new Among ( "atie", -1, 1, "", this),
|
||||
new Among ( "isme", -1, 5, "", this),
|
||||
new Among ( "ing", -1, 5, "", this),
|
||||
new Among ( "arij", -1, 6, "", this),
|
||||
new Among ( "erij", -1, 5, "", this),
|
||||
new Among ( "sel", -1, 3, "", this),
|
||||
new Among ( "rder", -1, 4, "", this),
|
||||
new Among ( "ster", -1, 3, "", this),
|
||||
new Among ( "iteit", -1, 2, "", this),
|
||||
new Among ( "dst", -1, 10, "", this),
|
||||
new Among ( "tst", -1, 9, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "heid", -1, 3, "", methodObject ),
|
||||
new Among ( "fie", -1, 7, "", methodObject ),
|
||||
new Among ( "gie", -1, 8, "", methodObject ),
|
||||
new Among ( "atie", -1, 1, "", methodObject ),
|
||||
new Among ( "isme", -1, 5, "", methodObject ),
|
||||
new Among ( "ing", -1, 5, "", methodObject ),
|
||||
new Among ( "arij", -1, 6, "", methodObject ),
|
||||
new Among ( "erij", -1, 5, "", methodObject ),
|
||||
new Among ( "sel", -1, 3, "", methodObject ),
|
||||
new Among ( "rder", -1, 4, "", methodObject ),
|
||||
new Among ( "ster", -1, 3, "", methodObject ),
|
||||
new Among ( "iteit", -1, 2, "", methodObject ),
|
||||
new Among ( "dst", -1, 10, "", methodObject ),
|
||||
new Among ( "tst", -1, 9, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "end", -1, 10, "", this),
|
||||
new Among ( "atief", -1, 2, "", this),
|
||||
new Among ( "erig", -1, 10, "", this),
|
||||
new Among ( "achtig", -1, 9, "", this),
|
||||
new Among ( "ioneel", -1, 1, "", this),
|
||||
new Among ( "baar", -1, 3, "", this),
|
||||
new Among ( "laar", -1, 5, "", this),
|
||||
new Among ( "naar", -1, 4, "", this),
|
||||
new Among ( "raar", -1, 6, "", this),
|
||||
new Among ( "eriger", -1, 10, "", this),
|
||||
new Among ( "achtiger", -1, 9, "", this),
|
||||
new Among ( "lijker", -1, 8, "", this),
|
||||
new Among ( "tant", -1, 7, "", this),
|
||||
new Among ( "erigst", -1, 10, "", this),
|
||||
new Among ( "achtigst", -1, 9, "", this),
|
||||
new Among ( "lijkst", -1, 8, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "end", -1, 10, "", methodObject ),
|
||||
new Among ( "atief", -1, 2, "", methodObject ),
|
||||
new Among ( "erig", -1, 10, "", methodObject ),
|
||||
new Among ( "achtig", -1, 9, "", methodObject ),
|
||||
new Among ( "ioneel", -1, 1, "", methodObject ),
|
||||
new Among ( "baar", -1, 3, "", methodObject ),
|
||||
new Among ( "laar", -1, 5, "", methodObject ),
|
||||
new Among ( "naar", -1, 4, "", methodObject ),
|
||||
new Among ( "raar", -1, 6, "", methodObject ),
|
||||
new Among ( "eriger", -1, 10, "", methodObject ),
|
||||
new Among ( "achtiger", -1, 9, "", methodObject ),
|
||||
new Among ( "lijker", -1, 8, "", methodObject ),
|
||||
new Among ( "tant", -1, 7, "", methodObject ),
|
||||
new Among ( "erigst", -1, 10, "", methodObject ),
|
||||
new Among ( "achtigst", -1, 9, "", methodObject ),
|
||||
new Among ( "lijkst", -1, 8, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ig", -1, 1, "", this),
|
||||
new Among ( "iger", -1, 1, "", this),
|
||||
new Among ( "igst", -1, 1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ig", -1, 1, "", methodObject ),
|
||||
new Among ( "iger", -1, 1, "", methodObject ),
|
||||
new Among ( "igst", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "ft", -1, 2, "", this),
|
||||
new Among ( "kt", -1, 1, "", this),
|
||||
new Among ( "pt", -1, 3, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "ft", -1, 2, "", methodObject ),
|
||||
new Among ( "kt", -1, 1, "", methodObject ),
|
||||
new Among ( "pt", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "bb", -1, 1, "", this),
|
||||
new Among ( "cc", -1, 2, "", this),
|
||||
new Among ( "dd", -1, 3, "", this),
|
||||
new Among ( "ff", -1, 4, "", this),
|
||||
new Among ( "gg", -1, 5, "", this),
|
||||
new Among ( "hh", -1, 6, "", this),
|
||||
new Among ( "jj", -1, 7, "", this),
|
||||
new Among ( "kk", -1, 8, "", this),
|
||||
new Among ( "ll", -1, 9, "", this),
|
||||
new Among ( "mm", -1, 10, "", this),
|
||||
new Among ( "nn", -1, 11, "", this),
|
||||
new Among ( "pp", -1, 12, "", this),
|
||||
new Among ( "qq", -1, 13, "", this),
|
||||
new Among ( "rr", -1, 14, "", this),
|
||||
new Among ( "ss", -1, 15, "", this),
|
||||
new Among ( "tt", -1, 16, "", this),
|
||||
new Among ( "v", -1, 21, "", this),
|
||||
new Among ( "vv", 16, 17, "", this),
|
||||
new Among ( "ww", -1, 18, "", this),
|
||||
new Among ( "xx", -1, 19, "", this),
|
||||
new Among ( "z", -1, 22, "", this),
|
||||
new Among ( "zz", 20, 20, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "bb", -1, 1, "", methodObject ),
|
||||
new Among ( "cc", -1, 2, "", methodObject ),
|
||||
new Among ( "dd", -1, 3, "", methodObject ),
|
||||
new Among ( "ff", -1, 4, "", methodObject ),
|
||||
new Among ( "gg", -1, 5, "", methodObject ),
|
||||
new Among ( "hh", -1, 6, "", methodObject ),
|
||||
new Among ( "jj", -1, 7, "", methodObject ),
|
||||
new Among ( "kk", -1, 8, "", methodObject ),
|
||||
new Among ( "ll", -1, 9, "", methodObject ),
|
||||
new Among ( "mm", -1, 10, "", methodObject ),
|
||||
new Among ( "nn", -1, 11, "", methodObject ),
|
||||
new Among ( "pp", -1, 12, "", methodObject ),
|
||||
new Among ( "qq", -1, 13, "", methodObject ),
|
||||
new Among ( "rr", -1, 14, "", methodObject ),
|
||||
new Among ( "ss", -1, 15, "", methodObject ),
|
||||
new Among ( "tt", -1, 16, "", methodObject ),
|
||||
new Among ( "v", -1, 21, "", methodObject ),
|
||||
new Among ( "vv", 16, 17, "", methodObject ),
|
||||
new Among ( "ww", -1, 18, "", methodObject ),
|
||||
new Among ( "xx", -1, 19, "", methodObject ),
|
||||
new Among ( "z", -1, 22, "", methodObject ),
|
||||
new Among ( "zz", 20, 20, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "d", -1, 1, "", this),
|
||||
new Among ( "t", -1, 2, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "d", -1, 1, "", methodObject ),
|
||||
new Among ( "t", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1 };
|
||||
|
@ -125,7 +132,7 @@ public class KpStemmer extends SnowballProgram {
|
|||
private int I_p2;
|
||||
private int I_p1;
|
||||
private int I_x;
|
||||
private StringBuilder S_ch = new StringBuilder();
|
||||
private java.lang.StringBuilder S_ch = new java.lang.StringBuilder();
|
||||
|
||||
private void copy_from(KpStemmer other) {
|
||||
B_GE_removed = other.B_GE_removed;
|
||||
|
@ -2177,5 +2184,15 @@ public class KpStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof KpStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return KpStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,371 +1,378 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class LovinsStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "d", -1, -1, "", this),
|
||||
new Among ( "f", -1, -1, "", this),
|
||||
new Among ( "ph", -1, -1, "", this),
|
||||
new Among ( "th", -1, -1, "", this),
|
||||
new Among ( "l", -1, -1, "", this),
|
||||
new Among ( "er", -1, -1, "", this),
|
||||
new Among ( "or", -1, -1, "", this),
|
||||
new Among ( "es", -1, -1, "", this),
|
||||
new Among ( "t", -1, -1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static LovinsStemmer methodObject = new LovinsStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "d", -1, -1, "", methodObject ),
|
||||
new Among ( "f", -1, -1, "", methodObject ),
|
||||
new Among ( "ph", -1, -1, "", methodObject ),
|
||||
new Among ( "th", -1, -1, "", methodObject ),
|
||||
new Among ( "l", -1, -1, "", methodObject ),
|
||||
new Among ( "er", -1, -1, "", methodObject ),
|
||||
new Among ( "or", -1, -1, "", methodObject ),
|
||||
new Among ( "es", -1, -1, "", methodObject ),
|
||||
new Among ( "t", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "s'", -1, 1, "r_A", this),
|
||||
new Among ( "a", -1, 1, "r_A", this),
|
||||
new Among ( "ia", 1, 1, "r_A", this),
|
||||
new Among ( "ata", 1, 1, "r_A", this),
|
||||
new Among ( "ic", -1, 1, "r_A", this),
|
||||
new Among ( "aic", 4, 1, "r_A", this),
|
||||
new Among ( "allic", 4, 1, "r_BB", this),
|
||||
new Among ( "aric", 4, 1, "r_A", this),
|
||||
new Among ( "atic", 4, 1, "r_B", this),
|
||||
new Among ( "itic", 4, 1, "r_H", this),
|
||||
new Among ( "antic", 4, 1, "r_C", this),
|
||||
new Among ( "istic", 4, 1, "r_A", this),
|
||||
new Among ( "alistic", 11, 1, "r_B", this),
|
||||
new Among ( "aristic", 11, 1, "r_A", this),
|
||||
new Among ( "ivistic", 11, 1, "r_A", this),
|
||||
new Among ( "ed", -1, 1, "r_E", this),
|
||||
new Among ( "anced", 15, 1, "r_B", this),
|
||||
new Among ( "enced", 15, 1, "r_A", this),
|
||||
new Among ( "ished", 15, 1, "r_A", this),
|
||||
new Among ( "ied", 15, 1, "r_A", this),
|
||||
new Among ( "ened", 15, 1, "r_E", this),
|
||||
new Among ( "ioned", 15, 1, "r_A", this),
|
||||
new Among ( "ated", 15, 1, "r_I", this),
|
||||
new Among ( "ented", 15, 1, "r_C", this),
|
||||
new Among ( "ized", 15, 1, "r_F", this),
|
||||
new Among ( "arized", 24, 1, "r_A", this),
|
||||
new Among ( "oid", -1, 1, "r_A", this),
|
||||
new Among ( "aroid", 26, 1, "r_A", this),
|
||||
new Among ( "hood", -1, 1, "r_A", this),
|
||||
new Among ( "ehood", 28, 1, "r_A", this),
|
||||
new Among ( "ihood", 28, 1, "r_A", this),
|
||||
new Among ( "elihood", 30, 1, "r_E", this),
|
||||
new Among ( "ward", -1, 1, "r_A", this),
|
||||
new Among ( "e", -1, 1, "r_A", this),
|
||||
new Among ( "ae", 33, 1, "r_A", this),
|
||||
new Among ( "ance", 33, 1, "r_B", this),
|
||||
new Among ( "icance", 35, 1, "r_A", this),
|
||||
new Among ( "ence", 33, 1, "r_A", this),
|
||||
new Among ( "ide", 33, 1, "r_L", this),
|
||||
new Among ( "icide", 38, 1, "r_A", this),
|
||||
new Among ( "otide", 38, 1, "r_A", this),
|
||||
new Among ( "age", 33, 1, "r_B", this),
|
||||
new Among ( "able", 33, 1, "r_A", this),
|
||||
new Among ( "atable", 42, 1, "r_A", this),
|
||||
new Among ( "izable", 42, 1, "r_E", this),
|
||||
new Among ( "arizable", 44, 1, "r_A", this),
|
||||
new Among ( "ible", 33, 1, "r_A", this),
|
||||
new Among ( "encible", 46, 1, "r_A", this),
|
||||
new Among ( "ene", 33, 1, "r_E", this),
|
||||
new Among ( "ine", 33, 1, "r_M", this),
|
||||
new Among ( "idine", 49, 1, "r_I", this),
|
||||
new Among ( "one", 33, 1, "r_R", this),
|
||||
new Among ( "ature", 33, 1, "r_E", this),
|
||||
new Among ( "eature", 52, 1, "r_Z", this),
|
||||
new Among ( "ese", 33, 1, "r_A", this),
|
||||
new Among ( "wise", 33, 1, "r_A", this),
|
||||
new Among ( "ate", 33, 1, "r_A", this),
|
||||
new Among ( "entiate", 56, 1, "r_A", this),
|
||||
new Among ( "inate", 56, 1, "r_A", this),
|
||||
new Among ( "ionate", 56, 1, "r_D", this),
|
||||
new Among ( "ite", 33, 1, "r_AA", this),
|
||||
new Among ( "ive", 33, 1, "r_A", this),
|
||||
new Among ( "ative", 61, 1, "r_A", this),
|
||||
new Among ( "ize", 33, 1, "r_F", this),
|
||||
new Among ( "alize", 63, 1, "r_A", this),
|
||||
new Among ( "icalize", 64, 1, "r_A", this),
|
||||
new Among ( "ialize", 64, 1, "r_A", this),
|
||||
new Among ( "entialize", 66, 1, "r_A", this),
|
||||
new Among ( "ionalize", 64, 1, "r_A", this),
|
||||
new Among ( "arize", 63, 1, "r_A", this),
|
||||
new Among ( "ing", -1, 1, "r_N", this),
|
||||
new Among ( "ancing", 70, 1, "r_B", this),
|
||||
new Among ( "encing", 70, 1, "r_A", this),
|
||||
new Among ( "aging", 70, 1, "r_B", this),
|
||||
new Among ( "ening", 70, 1, "r_E", this),
|
||||
new Among ( "ioning", 70, 1, "r_A", this),
|
||||
new Among ( "ating", 70, 1, "r_I", this),
|
||||
new Among ( "enting", 70, 1, "r_C", this),
|
||||
new Among ( "ying", 70, 1, "r_B", this),
|
||||
new Among ( "izing", 70, 1, "r_F", this),
|
||||
new Among ( "arizing", 79, 1, "r_A", this),
|
||||
new Among ( "ish", -1, 1, "r_C", this),
|
||||
new Among ( "yish", 81, 1, "r_A", this),
|
||||
new Among ( "i", -1, 1, "r_A", this),
|
||||
new Among ( "al", -1, 1, "r_BB", this),
|
||||
new Among ( "ical", 84, 1, "r_A", this),
|
||||
new Among ( "aical", 85, 1, "r_A", this),
|
||||
new Among ( "istical", 85, 1, "r_A", this),
|
||||
new Among ( "oidal", 84, 1, "r_A", this),
|
||||
new Among ( "eal", 84, 1, "r_Y", this),
|
||||
new Among ( "ial", 84, 1, "r_A", this),
|
||||
new Among ( "ancial", 90, 1, "r_A", this),
|
||||
new Among ( "arial", 90, 1, "r_A", this),
|
||||
new Among ( "ential", 90, 1, "r_A", this),
|
||||
new Among ( "ional", 84, 1, "r_A", this),
|
||||
new Among ( "ational", 94, 1, "r_B", this),
|
||||
new Among ( "izational", 95, 1, "r_A", this),
|
||||
new Among ( "ental", 84, 1, "r_A", this),
|
||||
new Among ( "ful", -1, 1, "r_A", this),
|
||||
new Among ( "eful", 98, 1, "r_A", this),
|
||||
new Among ( "iful", 98, 1, "r_A", this),
|
||||
new Among ( "yl", -1, 1, "r_R", this),
|
||||
new Among ( "ism", -1, 1, "r_B", this),
|
||||
new Among ( "icism", 102, 1, "r_A", this),
|
||||
new Among ( "oidism", 102, 1, "r_A", this),
|
||||
new Among ( "alism", 102, 1, "r_B", this),
|
||||
new Among ( "icalism", 105, 1, "r_A", this),
|
||||
new Among ( "ionalism", 105, 1, "r_A", this),
|
||||
new Among ( "inism", 102, 1, "r_J", this),
|
||||
new Among ( "ativism", 102, 1, "r_A", this),
|
||||
new Among ( "um", -1, 1, "r_U", this),
|
||||
new Among ( "ium", 110, 1, "r_A", this),
|
||||
new Among ( "ian", -1, 1, "r_A", this),
|
||||
new Among ( "ician", 112, 1, "r_A", this),
|
||||
new Among ( "en", -1, 1, "r_F", this),
|
||||
new Among ( "ogen", 114, 1, "r_A", this),
|
||||
new Among ( "on", -1, 1, "r_S", this),
|
||||
new Among ( "ion", 116, 1, "r_Q", this),
|
||||
new Among ( "ation", 117, 1, "r_B", this),
|
||||
new Among ( "ication", 118, 1, "r_G", this),
|
||||
new Among ( "entiation", 118, 1, "r_A", this),
|
||||
new Among ( "ination", 118, 1, "r_A", this),
|
||||
new Among ( "isation", 118, 1, "r_A", this),
|
||||
new Among ( "arisation", 122, 1, "r_A", this),
|
||||
new Among ( "entation", 118, 1, "r_A", this),
|
||||
new Among ( "ization", 118, 1, "r_F", this),
|
||||
new Among ( "arization", 125, 1, "r_A", this),
|
||||
new Among ( "action", 117, 1, "r_G", this),
|
||||
new Among ( "o", -1, 1, "r_A", this),
|
||||
new Among ( "ar", -1, 1, "r_X", this),
|
||||
new Among ( "ear", 129, 1, "r_Y", this),
|
||||
new Among ( "ier", -1, 1, "r_A", this),
|
||||
new Among ( "ariser", -1, 1, "r_A", this),
|
||||
new Among ( "izer", -1, 1, "r_F", this),
|
||||
new Among ( "arizer", 133, 1, "r_A", this),
|
||||
new Among ( "or", -1, 1, "r_T", this),
|
||||
new Among ( "ator", 135, 1, "r_A", this),
|
||||
new Among ( "s", -1, 1, "r_W", this),
|
||||
new Among ( "'s", 137, 1, "r_A", this),
|
||||
new Among ( "as", 137, 1, "r_B", this),
|
||||
new Among ( "ics", 137, 1, "r_A", this),
|
||||
new Among ( "istics", 140, 1, "r_A", this),
|
||||
new Among ( "es", 137, 1, "r_E", this),
|
||||
new Among ( "ances", 142, 1, "r_B", this),
|
||||
new Among ( "ences", 142, 1, "r_A", this),
|
||||
new Among ( "ides", 142, 1, "r_L", this),
|
||||
new Among ( "oides", 145, 1, "r_A", this),
|
||||
new Among ( "ages", 142, 1, "r_B", this),
|
||||
new Among ( "ies", 142, 1, "r_P", this),
|
||||
new Among ( "acies", 148, 1, "r_A", this),
|
||||
new Among ( "ancies", 148, 1, "r_A", this),
|
||||
new Among ( "encies", 148, 1, "r_A", this),
|
||||
new Among ( "aries", 148, 1, "r_A", this),
|
||||
new Among ( "ities", 148, 1, "r_A", this),
|
||||
new Among ( "alities", 153, 1, "r_A", this),
|
||||
new Among ( "ivities", 153, 1, "r_A", this),
|
||||
new Among ( "ines", 142, 1, "r_M", this),
|
||||
new Among ( "nesses", 142, 1, "r_A", this),
|
||||
new Among ( "ates", 142, 1, "r_A", this),
|
||||
new Among ( "atives", 142, 1, "r_A", this),
|
||||
new Among ( "ings", 137, 1, "r_N", this),
|
||||
new Among ( "is", 137, 1, "r_A", this),
|
||||
new Among ( "als", 137, 1, "r_BB", this),
|
||||
new Among ( "ials", 162, 1, "r_A", this),
|
||||
new Among ( "entials", 163, 1, "r_A", this),
|
||||
new Among ( "ionals", 162, 1, "r_A", this),
|
||||
new Among ( "isms", 137, 1, "r_B", this),
|
||||
new Among ( "ians", 137, 1, "r_A", this),
|
||||
new Among ( "icians", 167, 1, "r_A", this),
|
||||
new Among ( "ions", 137, 1, "r_B", this),
|
||||
new Among ( "ations", 169, 1, "r_B", this),
|
||||
new Among ( "arisations", 170, 1, "r_A", this),
|
||||
new Among ( "entations", 170, 1, "r_A", this),
|
||||
new Among ( "izations", 170, 1, "r_A", this),
|
||||
new Among ( "arizations", 173, 1, "r_A", this),
|
||||
new Among ( "ars", 137, 1, "r_O", this),
|
||||
new Among ( "iers", 137, 1, "r_A", this),
|
||||
new Among ( "izers", 137, 1, "r_F", this),
|
||||
new Among ( "ators", 137, 1, "r_A", this),
|
||||
new Among ( "less", 137, 1, "r_A", this),
|
||||
new Among ( "eless", 179, 1, "r_A", this),
|
||||
new Among ( "ness", 137, 1, "r_A", this),
|
||||
new Among ( "eness", 181, 1, "r_E", this),
|
||||
new Among ( "ableness", 182, 1, "r_A", this),
|
||||
new Among ( "eableness", 183, 1, "r_E", this),
|
||||
new Among ( "ibleness", 182, 1, "r_A", this),
|
||||
new Among ( "ateness", 182, 1, "r_A", this),
|
||||
new Among ( "iteness", 182, 1, "r_A", this),
|
||||
new Among ( "iveness", 182, 1, "r_A", this),
|
||||
new Among ( "ativeness", 188, 1, "r_A", this),
|
||||
new Among ( "ingness", 181, 1, "r_A", this),
|
||||
new Among ( "ishness", 181, 1, "r_A", this),
|
||||
new Among ( "iness", 181, 1, "r_A", this),
|
||||
new Among ( "ariness", 192, 1, "r_E", this),
|
||||
new Among ( "alness", 181, 1, "r_A", this),
|
||||
new Among ( "icalness", 194, 1, "r_A", this),
|
||||
new Among ( "antialness", 194, 1, "r_A", this),
|
||||
new Among ( "entialness", 194, 1, "r_A", this),
|
||||
new Among ( "ionalness", 194, 1, "r_A", this),
|
||||
new Among ( "fulness", 181, 1, "r_A", this),
|
||||
new Among ( "lessness", 181, 1, "r_A", this),
|
||||
new Among ( "ousness", 181, 1, "r_A", this),
|
||||
new Among ( "eousness", 201, 1, "r_A", this),
|
||||
new Among ( "iousness", 201, 1, "r_A", this),
|
||||
new Among ( "itousness", 201, 1, "r_A", this),
|
||||
new Among ( "entness", 181, 1, "r_A", this),
|
||||
new Among ( "ants", 137, 1, "r_B", this),
|
||||
new Among ( "ists", 137, 1, "r_A", this),
|
||||
new Among ( "icists", 207, 1, "r_A", this),
|
||||
new Among ( "us", 137, 1, "r_V", this),
|
||||
new Among ( "ous", 209, 1, "r_A", this),
|
||||
new Among ( "eous", 210, 1, "r_A", this),
|
||||
new Among ( "aceous", 211, 1, "r_A", this),
|
||||
new Among ( "antaneous", 211, 1, "r_A", this),
|
||||
new Among ( "ious", 210, 1, "r_A", this),
|
||||
new Among ( "acious", 214, 1, "r_B", this),
|
||||
new Among ( "itous", 210, 1, "r_A", this),
|
||||
new Among ( "ant", -1, 1, "r_B", this),
|
||||
new Among ( "icant", 217, 1, "r_A", this),
|
||||
new Among ( "ent", -1, 1, "r_C", this),
|
||||
new Among ( "ement", 219, 1, "r_A", this),
|
||||
new Among ( "izement", 220, 1, "r_A", this),
|
||||
new Among ( "ist", -1, 1, "r_A", this),
|
||||
new Among ( "icist", 222, 1, "r_A", this),
|
||||
new Among ( "alist", 222, 1, "r_A", this),
|
||||
new Among ( "icalist", 224, 1, "r_A", this),
|
||||
new Among ( "ialist", 224, 1, "r_A", this),
|
||||
new Among ( "ionist", 222, 1, "r_A", this),
|
||||
new Among ( "entist", 222, 1, "r_A", this),
|
||||
new Among ( "y", -1, 1, "r_B", this),
|
||||
new Among ( "acy", 229, 1, "r_A", this),
|
||||
new Among ( "ancy", 229, 1, "r_B", this),
|
||||
new Among ( "ency", 229, 1, "r_A", this),
|
||||
new Among ( "ly", 229, 1, "r_B", this),
|
||||
new Among ( "ealy", 233, 1, "r_Y", this),
|
||||
new Among ( "ably", 233, 1, "r_A", this),
|
||||
new Among ( "ibly", 233, 1, "r_A", this),
|
||||
new Among ( "edly", 233, 1, "r_E", this),
|
||||
new Among ( "iedly", 237, 1, "r_A", this),
|
||||
new Among ( "ely", 233, 1, "r_E", this),
|
||||
new Among ( "ately", 239, 1, "r_A", this),
|
||||
new Among ( "ively", 239, 1, "r_A", this),
|
||||
new Among ( "atively", 241, 1, "r_A", this),
|
||||
new Among ( "ingly", 233, 1, "r_B", this),
|
||||
new Among ( "atingly", 243, 1, "r_A", this),
|
||||
new Among ( "ily", 233, 1, "r_A", this),
|
||||
new Among ( "lily", 245, 1, "r_A", this),
|
||||
new Among ( "arily", 245, 1, "r_A", this),
|
||||
new Among ( "ally", 233, 1, "r_B", this),
|
||||
new Among ( "ically", 248, 1, "r_A", this),
|
||||
new Among ( "aically", 249, 1, "r_A", this),
|
||||
new Among ( "allically", 249, 1, "r_C", this),
|
||||
new Among ( "istically", 249, 1, "r_A", this),
|
||||
new Among ( "alistically", 252, 1, "r_B", this),
|
||||
new Among ( "oidally", 248, 1, "r_A", this),
|
||||
new Among ( "ially", 248, 1, "r_A", this),
|
||||
new Among ( "entially", 255, 1, "r_A", this),
|
||||
new Among ( "ionally", 248, 1, "r_A", this),
|
||||
new Among ( "ationally", 257, 1, "r_B", this),
|
||||
new Among ( "izationally", 258, 1, "r_B", this),
|
||||
new Among ( "entally", 248, 1, "r_A", this),
|
||||
new Among ( "fully", 233, 1, "r_A", this),
|
||||
new Among ( "efully", 261, 1, "r_A", this),
|
||||
new Among ( "ifully", 261, 1, "r_A", this),
|
||||
new Among ( "enly", 233, 1, "r_E", this),
|
||||
new Among ( "arly", 233, 1, "r_K", this),
|
||||
new Among ( "early", 265, 1, "r_Y", this),
|
||||
new Among ( "lessly", 233, 1, "r_A", this),
|
||||
new Among ( "ously", 233, 1, "r_A", this),
|
||||
new Among ( "eously", 268, 1, "r_A", this),
|
||||
new Among ( "iously", 268, 1, "r_A", this),
|
||||
new Among ( "ently", 233, 1, "r_A", this),
|
||||
new Among ( "ary", 229, 1, "r_F", this),
|
||||
new Among ( "ery", 229, 1, "r_E", this),
|
||||
new Among ( "icianry", 229, 1, "r_A", this),
|
||||
new Among ( "atory", 229, 1, "r_A", this),
|
||||
new Among ( "ity", 229, 1, "r_A", this),
|
||||
new Among ( "acity", 276, 1, "r_A", this),
|
||||
new Among ( "icity", 276, 1, "r_A", this),
|
||||
new Among ( "eity", 276, 1, "r_A", this),
|
||||
new Among ( "ality", 276, 1, "r_A", this),
|
||||
new Among ( "icality", 280, 1, "r_A", this),
|
||||
new Among ( "iality", 280, 1, "r_A", this),
|
||||
new Among ( "antiality", 282, 1, "r_A", this),
|
||||
new Among ( "entiality", 282, 1, "r_A", this),
|
||||
new Among ( "ionality", 280, 1, "r_A", this),
|
||||
new Among ( "elity", 276, 1, "r_A", this),
|
||||
new Among ( "ability", 276, 1, "r_A", this),
|
||||
new Among ( "izability", 287, 1, "r_A", this),
|
||||
new Among ( "arizability", 288, 1, "r_A", this),
|
||||
new Among ( "ibility", 276, 1, "r_A", this),
|
||||
new Among ( "inity", 276, 1, "r_CC", this),
|
||||
new Among ( "arity", 276, 1, "r_B", this),
|
||||
new Among ( "ivity", 276, 1, "r_A", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "s'", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "a", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "ia", 1, 1, "r_A", methodObject ),
|
||||
new Among ( "ata", 1, 1, "r_A", methodObject ),
|
||||
new Among ( "ic", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "aic", 4, 1, "r_A", methodObject ),
|
||||
new Among ( "allic", 4, 1, "r_BB", methodObject ),
|
||||
new Among ( "aric", 4, 1, "r_A", methodObject ),
|
||||
new Among ( "atic", 4, 1, "r_B", methodObject ),
|
||||
new Among ( "itic", 4, 1, "r_H", methodObject ),
|
||||
new Among ( "antic", 4, 1, "r_C", methodObject ),
|
||||
new Among ( "istic", 4, 1, "r_A", methodObject ),
|
||||
new Among ( "alistic", 11, 1, "r_B", methodObject ),
|
||||
new Among ( "aristic", 11, 1, "r_A", methodObject ),
|
||||
new Among ( "ivistic", 11, 1, "r_A", methodObject ),
|
||||
new Among ( "ed", -1, 1, "r_E", methodObject ),
|
||||
new Among ( "anced", 15, 1, "r_B", methodObject ),
|
||||
new Among ( "enced", 15, 1, "r_A", methodObject ),
|
||||
new Among ( "ished", 15, 1, "r_A", methodObject ),
|
||||
new Among ( "ied", 15, 1, "r_A", methodObject ),
|
||||
new Among ( "ened", 15, 1, "r_E", methodObject ),
|
||||
new Among ( "ioned", 15, 1, "r_A", methodObject ),
|
||||
new Among ( "ated", 15, 1, "r_I", methodObject ),
|
||||
new Among ( "ented", 15, 1, "r_C", methodObject ),
|
||||
new Among ( "ized", 15, 1, "r_F", methodObject ),
|
||||
new Among ( "arized", 24, 1, "r_A", methodObject ),
|
||||
new Among ( "oid", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "aroid", 26, 1, "r_A", methodObject ),
|
||||
new Among ( "hood", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "ehood", 28, 1, "r_A", methodObject ),
|
||||
new Among ( "ihood", 28, 1, "r_A", methodObject ),
|
||||
new Among ( "elihood", 30, 1, "r_E", methodObject ),
|
||||
new Among ( "ward", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "e", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "ae", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "ance", 33, 1, "r_B", methodObject ),
|
||||
new Among ( "icance", 35, 1, "r_A", methodObject ),
|
||||
new Among ( "ence", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "ide", 33, 1, "r_L", methodObject ),
|
||||
new Among ( "icide", 38, 1, "r_A", methodObject ),
|
||||
new Among ( "otide", 38, 1, "r_A", methodObject ),
|
||||
new Among ( "age", 33, 1, "r_B", methodObject ),
|
||||
new Among ( "able", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "atable", 42, 1, "r_A", methodObject ),
|
||||
new Among ( "izable", 42, 1, "r_E", methodObject ),
|
||||
new Among ( "arizable", 44, 1, "r_A", methodObject ),
|
||||
new Among ( "ible", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "encible", 46, 1, "r_A", methodObject ),
|
||||
new Among ( "ene", 33, 1, "r_E", methodObject ),
|
||||
new Among ( "ine", 33, 1, "r_M", methodObject ),
|
||||
new Among ( "idine", 49, 1, "r_I", methodObject ),
|
||||
new Among ( "one", 33, 1, "r_R", methodObject ),
|
||||
new Among ( "ature", 33, 1, "r_E", methodObject ),
|
||||
new Among ( "eature", 52, 1, "r_Z", methodObject ),
|
||||
new Among ( "ese", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "wise", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "ate", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "entiate", 56, 1, "r_A", methodObject ),
|
||||
new Among ( "inate", 56, 1, "r_A", methodObject ),
|
||||
new Among ( "ionate", 56, 1, "r_D", methodObject ),
|
||||
new Among ( "ite", 33, 1, "r_AA", methodObject ),
|
||||
new Among ( "ive", 33, 1, "r_A", methodObject ),
|
||||
new Among ( "ative", 61, 1, "r_A", methodObject ),
|
||||
new Among ( "ize", 33, 1, "r_F", methodObject ),
|
||||
new Among ( "alize", 63, 1, "r_A", methodObject ),
|
||||
new Among ( "icalize", 64, 1, "r_A", methodObject ),
|
||||
new Among ( "ialize", 64, 1, "r_A", methodObject ),
|
||||
new Among ( "entialize", 66, 1, "r_A", methodObject ),
|
||||
new Among ( "ionalize", 64, 1, "r_A", methodObject ),
|
||||
new Among ( "arize", 63, 1, "r_A", methodObject ),
|
||||
new Among ( "ing", -1, 1, "r_N", methodObject ),
|
||||
new Among ( "ancing", 70, 1, "r_B", methodObject ),
|
||||
new Among ( "encing", 70, 1, "r_A", methodObject ),
|
||||
new Among ( "aging", 70, 1, "r_B", methodObject ),
|
||||
new Among ( "ening", 70, 1, "r_E", methodObject ),
|
||||
new Among ( "ioning", 70, 1, "r_A", methodObject ),
|
||||
new Among ( "ating", 70, 1, "r_I", methodObject ),
|
||||
new Among ( "enting", 70, 1, "r_C", methodObject ),
|
||||
new Among ( "ying", 70, 1, "r_B", methodObject ),
|
||||
new Among ( "izing", 70, 1, "r_F", methodObject ),
|
||||
new Among ( "arizing", 79, 1, "r_A", methodObject ),
|
||||
new Among ( "ish", -1, 1, "r_C", methodObject ),
|
||||
new Among ( "yish", 81, 1, "r_A", methodObject ),
|
||||
new Among ( "i", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "al", -1, 1, "r_BB", methodObject ),
|
||||
new Among ( "ical", 84, 1, "r_A", methodObject ),
|
||||
new Among ( "aical", 85, 1, "r_A", methodObject ),
|
||||
new Among ( "istical", 85, 1, "r_A", methodObject ),
|
||||
new Among ( "oidal", 84, 1, "r_A", methodObject ),
|
||||
new Among ( "eal", 84, 1, "r_Y", methodObject ),
|
||||
new Among ( "ial", 84, 1, "r_A", methodObject ),
|
||||
new Among ( "ancial", 90, 1, "r_A", methodObject ),
|
||||
new Among ( "arial", 90, 1, "r_A", methodObject ),
|
||||
new Among ( "ential", 90, 1, "r_A", methodObject ),
|
||||
new Among ( "ional", 84, 1, "r_A", methodObject ),
|
||||
new Among ( "ational", 94, 1, "r_B", methodObject ),
|
||||
new Among ( "izational", 95, 1, "r_A", methodObject ),
|
||||
new Among ( "ental", 84, 1, "r_A", methodObject ),
|
||||
new Among ( "ful", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "eful", 98, 1, "r_A", methodObject ),
|
||||
new Among ( "iful", 98, 1, "r_A", methodObject ),
|
||||
new Among ( "yl", -1, 1, "r_R", methodObject ),
|
||||
new Among ( "ism", -1, 1, "r_B", methodObject ),
|
||||
new Among ( "icism", 102, 1, "r_A", methodObject ),
|
||||
new Among ( "oidism", 102, 1, "r_A", methodObject ),
|
||||
new Among ( "alism", 102, 1, "r_B", methodObject ),
|
||||
new Among ( "icalism", 105, 1, "r_A", methodObject ),
|
||||
new Among ( "ionalism", 105, 1, "r_A", methodObject ),
|
||||
new Among ( "inism", 102, 1, "r_J", methodObject ),
|
||||
new Among ( "ativism", 102, 1, "r_A", methodObject ),
|
||||
new Among ( "um", -1, 1, "r_U", methodObject ),
|
||||
new Among ( "ium", 110, 1, "r_A", methodObject ),
|
||||
new Among ( "ian", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "ician", 112, 1, "r_A", methodObject ),
|
||||
new Among ( "en", -1, 1, "r_F", methodObject ),
|
||||
new Among ( "ogen", 114, 1, "r_A", methodObject ),
|
||||
new Among ( "on", -1, 1, "r_S", methodObject ),
|
||||
new Among ( "ion", 116, 1, "r_Q", methodObject ),
|
||||
new Among ( "ation", 117, 1, "r_B", methodObject ),
|
||||
new Among ( "ication", 118, 1, "r_G", methodObject ),
|
||||
new Among ( "entiation", 118, 1, "r_A", methodObject ),
|
||||
new Among ( "ination", 118, 1, "r_A", methodObject ),
|
||||
new Among ( "isation", 118, 1, "r_A", methodObject ),
|
||||
new Among ( "arisation", 122, 1, "r_A", methodObject ),
|
||||
new Among ( "entation", 118, 1, "r_A", methodObject ),
|
||||
new Among ( "ization", 118, 1, "r_F", methodObject ),
|
||||
new Among ( "arization", 125, 1, "r_A", methodObject ),
|
||||
new Among ( "action", 117, 1, "r_G", methodObject ),
|
||||
new Among ( "o", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "ar", -1, 1, "r_X", methodObject ),
|
||||
new Among ( "ear", 129, 1, "r_Y", methodObject ),
|
||||
new Among ( "ier", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "ariser", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "izer", -1, 1, "r_F", methodObject ),
|
||||
new Among ( "arizer", 133, 1, "r_A", methodObject ),
|
||||
new Among ( "or", -1, 1, "r_T", methodObject ),
|
||||
new Among ( "ator", 135, 1, "r_A", methodObject ),
|
||||
new Among ( "s", -1, 1, "r_W", methodObject ),
|
||||
new Among ( "'s", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "as", 137, 1, "r_B", methodObject ),
|
||||
new Among ( "ics", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "istics", 140, 1, "r_A", methodObject ),
|
||||
new Among ( "es", 137, 1, "r_E", methodObject ),
|
||||
new Among ( "ances", 142, 1, "r_B", methodObject ),
|
||||
new Among ( "ences", 142, 1, "r_A", methodObject ),
|
||||
new Among ( "ides", 142, 1, "r_L", methodObject ),
|
||||
new Among ( "oides", 145, 1, "r_A", methodObject ),
|
||||
new Among ( "ages", 142, 1, "r_B", methodObject ),
|
||||
new Among ( "ies", 142, 1, "r_P", methodObject ),
|
||||
new Among ( "acies", 148, 1, "r_A", methodObject ),
|
||||
new Among ( "ancies", 148, 1, "r_A", methodObject ),
|
||||
new Among ( "encies", 148, 1, "r_A", methodObject ),
|
||||
new Among ( "aries", 148, 1, "r_A", methodObject ),
|
||||
new Among ( "ities", 148, 1, "r_A", methodObject ),
|
||||
new Among ( "alities", 153, 1, "r_A", methodObject ),
|
||||
new Among ( "ivities", 153, 1, "r_A", methodObject ),
|
||||
new Among ( "ines", 142, 1, "r_M", methodObject ),
|
||||
new Among ( "nesses", 142, 1, "r_A", methodObject ),
|
||||
new Among ( "ates", 142, 1, "r_A", methodObject ),
|
||||
new Among ( "atives", 142, 1, "r_A", methodObject ),
|
||||
new Among ( "ings", 137, 1, "r_N", methodObject ),
|
||||
new Among ( "is", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "als", 137, 1, "r_BB", methodObject ),
|
||||
new Among ( "ials", 162, 1, "r_A", methodObject ),
|
||||
new Among ( "entials", 163, 1, "r_A", methodObject ),
|
||||
new Among ( "ionals", 162, 1, "r_A", methodObject ),
|
||||
new Among ( "isms", 137, 1, "r_B", methodObject ),
|
||||
new Among ( "ians", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "icians", 167, 1, "r_A", methodObject ),
|
||||
new Among ( "ions", 137, 1, "r_B", methodObject ),
|
||||
new Among ( "ations", 169, 1, "r_B", methodObject ),
|
||||
new Among ( "arisations", 170, 1, "r_A", methodObject ),
|
||||
new Among ( "entations", 170, 1, "r_A", methodObject ),
|
||||
new Among ( "izations", 170, 1, "r_A", methodObject ),
|
||||
new Among ( "arizations", 173, 1, "r_A", methodObject ),
|
||||
new Among ( "ars", 137, 1, "r_O", methodObject ),
|
||||
new Among ( "iers", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "izers", 137, 1, "r_F", methodObject ),
|
||||
new Among ( "ators", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "less", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "eless", 179, 1, "r_A", methodObject ),
|
||||
new Among ( "ness", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "eness", 181, 1, "r_E", methodObject ),
|
||||
new Among ( "ableness", 182, 1, "r_A", methodObject ),
|
||||
new Among ( "eableness", 183, 1, "r_E", methodObject ),
|
||||
new Among ( "ibleness", 182, 1, "r_A", methodObject ),
|
||||
new Among ( "ateness", 182, 1, "r_A", methodObject ),
|
||||
new Among ( "iteness", 182, 1, "r_A", methodObject ),
|
||||
new Among ( "iveness", 182, 1, "r_A", methodObject ),
|
||||
new Among ( "ativeness", 188, 1, "r_A", methodObject ),
|
||||
new Among ( "ingness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "ishness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "iness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "ariness", 192, 1, "r_E", methodObject ),
|
||||
new Among ( "alness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "icalness", 194, 1, "r_A", methodObject ),
|
||||
new Among ( "antialness", 194, 1, "r_A", methodObject ),
|
||||
new Among ( "entialness", 194, 1, "r_A", methodObject ),
|
||||
new Among ( "ionalness", 194, 1, "r_A", methodObject ),
|
||||
new Among ( "fulness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "lessness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "ousness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "eousness", 201, 1, "r_A", methodObject ),
|
||||
new Among ( "iousness", 201, 1, "r_A", methodObject ),
|
||||
new Among ( "itousness", 201, 1, "r_A", methodObject ),
|
||||
new Among ( "entness", 181, 1, "r_A", methodObject ),
|
||||
new Among ( "ants", 137, 1, "r_B", methodObject ),
|
||||
new Among ( "ists", 137, 1, "r_A", methodObject ),
|
||||
new Among ( "icists", 207, 1, "r_A", methodObject ),
|
||||
new Among ( "us", 137, 1, "r_V", methodObject ),
|
||||
new Among ( "ous", 209, 1, "r_A", methodObject ),
|
||||
new Among ( "eous", 210, 1, "r_A", methodObject ),
|
||||
new Among ( "aceous", 211, 1, "r_A", methodObject ),
|
||||
new Among ( "antaneous", 211, 1, "r_A", methodObject ),
|
||||
new Among ( "ious", 210, 1, "r_A", methodObject ),
|
||||
new Among ( "acious", 214, 1, "r_B", methodObject ),
|
||||
new Among ( "itous", 210, 1, "r_A", methodObject ),
|
||||
new Among ( "ant", -1, 1, "r_B", methodObject ),
|
||||
new Among ( "icant", 217, 1, "r_A", methodObject ),
|
||||
new Among ( "ent", -1, 1, "r_C", methodObject ),
|
||||
new Among ( "ement", 219, 1, "r_A", methodObject ),
|
||||
new Among ( "izement", 220, 1, "r_A", methodObject ),
|
||||
new Among ( "ist", -1, 1, "r_A", methodObject ),
|
||||
new Among ( "icist", 222, 1, "r_A", methodObject ),
|
||||
new Among ( "alist", 222, 1, "r_A", methodObject ),
|
||||
new Among ( "icalist", 224, 1, "r_A", methodObject ),
|
||||
new Among ( "ialist", 224, 1, "r_A", methodObject ),
|
||||
new Among ( "ionist", 222, 1, "r_A", methodObject ),
|
||||
new Among ( "entist", 222, 1, "r_A", methodObject ),
|
||||
new Among ( "y", -1, 1, "r_B", methodObject ),
|
||||
new Among ( "acy", 229, 1, "r_A", methodObject ),
|
||||
new Among ( "ancy", 229, 1, "r_B", methodObject ),
|
||||
new Among ( "ency", 229, 1, "r_A", methodObject ),
|
||||
new Among ( "ly", 229, 1, "r_B", methodObject ),
|
||||
new Among ( "ealy", 233, 1, "r_Y", methodObject ),
|
||||
new Among ( "ably", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "ibly", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "edly", 233, 1, "r_E", methodObject ),
|
||||
new Among ( "iedly", 237, 1, "r_A", methodObject ),
|
||||
new Among ( "ely", 233, 1, "r_E", methodObject ),
|
||||
new Among ( "ately", 239, 1, "r_A", methodObject ),
|
||||
new Among ( "ively", 239, 1, "r_A", methodObject ),
|
||||
new Among ( "atively", 241, 1, "r_A", methodObject ),
|
||||
new Among ( "ingly", 233, 1, "r_B", methodObject ),
|
||||
new Among ( "atingly", 243, 1, "r_A", methodObject ),
|
||||
new Among ( "ily", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "lily", 245, 1, "r_A", methodObject ),
|
||||
new Among ( "arily", 245, 1, "r_A", methodObject ),
|
||||
new Among ( "ally", 233, 1, "r_B", methodObject ),
|
||||
new Among ( "ically", 248, 1, "r_A", methodObject ),
|
||||
new Among ( "aically", 249, 1, "r_A", methodObject ),
|
||||
new Among ( "allically", 249, 1, "r_C", methodObject ),
|
||||
new Among ( "istically", 249, 1, "r_A", methodObject ),
|
||||
new Among ( "alistically", 252, 1, "r_B", methodObject ),
|
||||
new Among ( "oidally", 248, 1, "r_A", methodObject ),
|
||||
new Among ( "ially", 248, 1, "r_A", methodObject ),
|
||||
new Among ( "entially", 255, 1, "r_A", methodObject ),
|
||||
new Among ( "ionally", 248, 1, "r_A", methodObject ),
|
||||
new Among ( "ationally", 257, 1, "r_B", methodObject ),
|
||||
new Among ( "izationally", 258, 1, "r_B", methodObject ),
|
||||
new Among ( "entally", 248, 1, "r_A", methodObject ),
|
||||
new Among ( "fully", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "efully", 261, 1, "r_A", methodObject ),
|
||||
new Among ( "ifully", 261, 1, "r_A", methodObject ),
|
||||
new Among ( "enly", 233, 1, "r_E", methodObject ),
|
||||
new Among ( "arly", 233, 1, "r_K", methodObject ),
|
||||
new Among ( "early", 265, 1, "r_Y", methodObject ),
|
||||
new Among ( "lessly", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "ously", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "eously", 268, 1, "r_A", methodObject ),
|
||||
new Among ( "iously", 268, 1, "r_A", methodObject ),
|
||||
new Among ( "ently", 233, 1, "r_A", methodObject ),
|
||||
new Among ( "ary", 229, 1, "r_F", methodObject ),
|
||||
new Among ( "ery", 229, 1, "r_E", methodObject ),
|
||||
new Among ( "icianry", 229, 1, "r_A", methodObject ),
|
||||
new Among ( "atory", 229, 1, "r_A", methodObject ),
|
||||
new Among ( "ity", 229, 1, "r_A", methodObject ),
|
||||
new Among ( "acity", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "icity", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "eity", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "ality", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "icality", 280, 1, "r_A", methodObject ),
|
||||
new Among ( "iality", 280, 1, "r_A", methodObject ),
|
||||
new Among ( "antiality", 282, 1, "r_A", methodObject ),
|
||||
new Among ( "entiality", 282, 1, "r_A", methodObject ),
|
||||
new Among ( "ionality", 280, 1, "r_A", methodObject ),
|
||||
new Among ( "elity", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "ability", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "izability", 287, 1, "r_A", methodObject ),
|
||||
new Among ( "arizability", 288, 1, "r_A", methodObject ),
|
||||
new Among ( "ibility", 276, 1, "r_A", methodObject ),
|
||||
new Among ( "inity", 276, 1, "r_CC", methodObject ),
|
||||
new Among ( "arity", 276, 1, "r_B", methodObject ),
|
||||
new Among ( "ivity", 276, 1, "r_A", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "bb", -1, -1, "", this),
|
||||
new Among ( "dd", -1, -1, "", this),
|
||||
new Among ( "gg", -1, -1, "", this),
|
||||
new Among ( "ll", -1, -1, "", this),
|
||||
new Among ( "mm", -1, -1, "", this),
|
||||
new Among ( "nn", -1, -1, "", this),
|
||||
new Among ( "pp", -1, -1, "", this),
|
||||
new Among ( "rr", -1, -1, "", this),
|
||||
new Among ( "ss", -1, -1, "", this),
|
||||
new Among ( "tt", -1, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "bb", -1, -1, "", methodObject ),
|
||||
new Among ( "dd", -1, -1, "", methodObject ),
|
||||
new Among ( "gg", -1, -1, "", methodObject ),
|
||||
new Among ( "ll", -1, -1, "", methodObject ),
|
||||
new Among ( "mm", -1, -1, "", methodObject ),
|
||||
new Among ( "nn", -1, -1, "", methodObject ),
|
||||
new Among ( "pp", -1, -1, "", methodObject ),
|
||||
new Among ( "rr", -1, -1, "", methodObject ),
|
||||
new Among ( "ss", -1, -1, "", methodObject ),
|
||||
new Among ( "tt", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "uad", -1, 18, "", this),
|
||||
new Among ( "vad", -1, 19, "", this),
|
||||
new Among ( "cid", -1, 20, "", this),
|
||||
new Among ( "lid", -1, 21, "", this),
|
||||
new Among ( "erid", -1, 22, "", this),
|
||||
new Among ( "pand", -1, 23, "", this),
|
||||
new Among ( "end", -1, 24, "", this),
|
||||
new Among ( "ond", -1, 25, "", this),
|
||||
new Among ( "lud", -1, 26, "", this),
|
||||
new Among ( "rud", -1, 27, "", this),
|
||||
new Among ( "ul", -1, 9, "", this),
|
||||
new Among ( "her", -1, 28, "", this),
|
||||
new Among ( "metr", -1, 7, "", this),
|
||||
new Among ( "istr", -1, 6, "", this),
|
||||
new Among ( "urs", -1, 5, "", this),
|
||||
new Among ( "uct", -1, 2, "", this),
|
||||
new Among ( "et", -1, 32, "", this),
|
||||
new Among ( "mit", -1, 29, "", this),
|
||||
new Among ( "ent", -1, 30, "", this),
|
||||
new Among ( "umpt", -1, 3, "", this),
|
||||
new Among ( "rpt", -1, 4, "", this),
|
||||
new Among ( "ert", -1, 31, "", this),
|
||||
new Among ( "yt", -1, 33, "", this),
|
||||
new Among ( "iev", -1, 1, "", this),
|
||||
new Among ( "olv", -1, 8, "", this),
|
||||
new Among ( "ax", -1, 14, "", this),
|
||||
new Among ( "ex", -1, 15, "", this),
|
||||
new Among ( "bex", 26, 10, "", this),
|
||||
new Among ( "dex", 26, 11, "", this),
|
||||
new Among ( "pex", 26, 12, "", this),
|
||||
new Among ( "tex", 26, 13, "", this),
|
||||
new Among ( "ix", -1, 16, "", this),
|
||||
new Among ( "lux", -1, 17, "", this),
|
||||
new Among ( "yz", -1, 34, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "uad", -1, 18, "", methodObject ),
|
||||
new Among ( "vad", -1, 19, "", methodObject ),
|
||||
new Among ( "cid", -1, 20, "", methodObject ),
|
||||
new Among ( "lid", -1, 21, "", methodObject ),
|
||||
new Among ( "erid", -1, 22, "", methodObject ),
|
||||
new Among ( "pand", -1, 23, "", methodObject ),
|
||||
new Among ( "end", -1, 24, "", methodObject ),
|
||||
new Among ( "ond", -1, 25, "", methodObject ),
|
||||
new Among ( "lud", -1, 26, "", methodObject ),
|
||||
new Among ( "rud", -1, 27, "", methodObject ),
|
||||
new Among ( "ul", -1, 9, "", methodObject ),
|
||||
new Among ( "her", -1, 28, "", methodObject ),
|
||||
new Among ( "metr", -1, 7, "", methodObject ),
|
||||
new Among ( "istr", -1, 6, "", methodObject ),
|
||||
new Among ( "urs", -1, 5, "", methodObject ),
|
||||
new Among ( "uct", -1, 2, "", methodObject ),
|
||||
new Among ( "et", -1, 32, "", methodObject ),
|
||||
new Among ( "mit", -1, 29, "", methodObject ),
|
||||
new Among ( "ent", -1, 30, "", methodObject ),
|
||||
new Among ( "umpt", -1, 3, "", methodObject ),
|
||||
new Among ( "rpt", -1, 4, "", methodObject ),
|
||||
new Among ( "ert", -1, 31, "", methodObject ),
|
||||
new Among ( "yt", -1, 33, "", methodObject ),
|
||||
new Among ( "iev", -1, 1, "", methodObject ),
|
||||
new Among ( "olv", -1, 8, "", methodObject ),
|
||||
new Among ( "ax", -1, 14, "", methodObject ),
|
||||
new Among ( "ex", -1, 15, "", methodObject ),
|
||||
new Among ( "bex", 26, 10, "", methodObject ),
|
||||
new Among ( "dex", 26, 11, "", methodObject ),
|
||||
new Among ( "pex", 26, 12, "", methodObject ),
|
||||
new Among ( "tex", 26, 13, "", methodObject ),
|
||||
new Among ( "ix", -1, 16, "", methodObject ),
|
||||
new Among ( "lux", -1, 17, "", methodObject ),
|
||||
new Among ( "yz", -1, 34, "", methodObject )
|
||||
};
|
||||
|
||||
|
||||
|
@ -1904,5 +1911,15 @@ public class LovinsStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof LovinsStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return LovinsStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,63 +1,70 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class NorwegianStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "a", -1, 1, "", this),
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "ede", 1, 1, "", this),
|
||||
new Among ( "ande", 1, 1, "", this),
|
||||
new Among ( "ende", 1, 1, "", this),
|
||||
new Among ( "ane", 1, 1, "", this),
|
||||
new Among ( "ene", 1, 1, "", this),
|
||||
new Among ( "hetene", 6, 1, "", this),
|
||||
new Among ( "erte", 1, 3, "", this),
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "heten", 9, 1, "", this),
|
||||
new Among ( "ar", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "heter", 12, 1, "", this),
|
||||
new Among ( "s", -1, 2, "", this),
|
||||
new Among ( "as", 14, 1, "", this),
|
||||
new Among ( "es", 14, 1, "", this),
|
||||
new Among ( "edes", 16, 1, "", this),
|
||||
new Among ( "endes", 16, 1, "", this),
|
||||
new Among ( "enes", 16, 1, "", this),
|
||||
new Among ( "hetenes", 19, 1, "", this),
|
||||
new Among ( "ens", 14, 1, "", this),
|
||||
new Among ( "hetens", 21, 1, "", this),
|
||||
new Among ( "ers", 14, 1, "", this),
|
||||
new Among ( "ets", 14, 1, "", this),
|
||||
new Among ( "et", -1, 1, "", this),
|
||||
new Among ( "het", 25, 1, "", this),
|
||||
new Among ( "ert", -1, 3, "", this),
|
||||
new Among ( "ast", -1, 1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static NorwegianStemmer methodObject = new NorwegianStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "a", -1, 1, "", methodObject ),
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "ede", 1, 1, "", methodObject ),
|
||||
new Among ( "ande", 1, 1, "", methodObject ),
|
||||
new Among ( "ende", 1, 1, "", methodObject ),
|
||||
new Among ( "ane", 1, 1, "", methodObject ),
|
||||
new Among ( "ene", 1, 1, "", methodObject ),
|
||||
new Among ( "hetene", 6, 1, "", methodObject ),
|
||||
new Among ( "erte", 1, 3, "", methodObject ),
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "heten", 9, 1, "", methodObject ),
|
||||
new Among ( "ar", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "heter", 12, 1, "", methodObject ),
|
||||
new Among ( "s", -1, 2, "", methodObject ),
|
||||
new Among ( "as", 14, 1, "", methodObject ),
|
||||
new Among ( "es", 14, 1, "", methodObject ),
|
||||
new Among ( "edes", 16, 1, "", methodObject ),
|
||||
new Among ( "endes", 16, 1, "", methodObject ),
|
||||
new Among ( "enes", 16, 1, "", methodObject ),
|
||||
new Among ( "hetenes", 19, 1, "", methodObject ),
|
||||
new Among ( "ens", 14, 1, "", methodObject ),
|
||||
new Among ( "hetens", 21, 1, "", methodObject ),
|
||||
new Among ( "ers", 14, 1, "", methodObject ),
|
||||
new Among ( "ets", 14, 1, "", methodObject ),
|
||||
new Among ( "et", -1, 1, "", methodObject ),
|
||||
new Among ( "het", 25, 1, "", methodObject ),
|
||||
new Among ( "ert", -1, 3, "", methodObject ),
|
||||
new Among ( "ast", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "dt", -1, -1, "", this),
|
||||
new Among ( "vt", -1, -1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "dt", -1, -1, "", methodObject ),
|
||||
new Among ( "vt", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "leg", -1, 1, "", this),
|
||||
new Among ( "eleg", 0, 1, "", this),
|
||||
new Among ( "ig", -1, 1, "", this),
|
||||
new Among ( "eig", 2, 1, "", this),
|
||||
new Among ( "lig", 2, 1, "", this),
|
||||
new Among ( "elig", 4, 1, "", this),
|
||||
new Among ( "els", -1, 1, "", this),
|
||||
new Among ( "lov", -1, 1, "", this),
|
||||
new Among ( "elov", 7, 1, "", this),
|
||||
new Among ( "slov", 7, 1, "", this),
|
||||
new Among ( "hetslov", 9, 1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "leg", -1, 1, "", methodObject ),
|
||||
new Among ( "eleg", 0, 1, "", methodObject ),
|
||||
new Among ( "ig", -1, 1, "", methodObject ),
|
||||
new Among ( "eig", 2, 1, "", methodObject ),
|
||||
new Among ( "lig", 2, 1, "", methodObject ),
|
||||
new Among ( "elig", 4, 1, "", methodObject ),
|
||||
new Among ( "els", -1, 1, "", methodObject ),
|
||||
new Among ( "lov", -1, 1, "", methodObject ),
|
||||
new Among ( "elov", 7, 1, "", methodObject ),
|
||||
new Among ( "slov", 7, 1, "", methodObject ),
|
||||
new Among ( "hetslov", 9, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 48, 0, 128 };
|
||||
|
@ -354,5 +361,15 @@ public class NorwegianStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof NorwegianStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return NorwegianStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,96 +1,103 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class PorterStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "s", -1, 3, "", this),
|
||||
new Among ( "ies", 0, 2, "", this),
|
||||
new Among ( "sses", 0, 1, "", this),
|
||||
new Among ( "ss", 0, -1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static PorterStemmer methodObject = new PorterStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "s", -1, 3, "", methodObject ),
|
||||
new Among ( "ies", 0, 2, "", methodObject ),
|
||||
new Among ( "sses", 0, 1, "", methodObject ),
|
||||
new Among ( "ss", 0, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "bb", 0, 2, "", this),
|
||||
new Among ( "dd", 0, 2, "", this),
|
||||
new Among ( "ff", 0, 2, "", this),
|
||||
new Among ( "gg", 0, 2, "", this),
|
||||
new Among ( "bl", 0, 1, "", this),
|
||||
new Among ( "mm", 0, 2, "", this),
|
||||
new Among ( "nn", 0, 2, "", this),
|
||||
new Among ( "pp", 0, 2, "", this),
|
||||
new Among ( "rr", 0, 2, "", this),
|
||||
new Among ( "at", 0, 1, "", this),
|
||||
new Among ( "tt", 0, 2, "", this),
|
||||
new Among ( "iz", 0, 1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "bb", 0, 2, "", methodObject ),
|
||||
new Among ( "dd", 0, 2, "", methodObject ),
|
||||
new Among ( "ff", 0, 2, "", methodObject ),
|
||||
new Among ( "gg", 0, 2, "", methodObject ),
|
||||
new Among ( "bl", 0, 1, "", methodObject ),
|
||||
new Among ( "mm", 0, 2, "", methodObject ),
|
||||
new Among ( "nn", 0, 2, "", methodObject ),
|
||||
new Among ( "pp", 0, 2, "", methodObject ),
|
||||
new Among ( "rr", 0, 2, "", methodObject ),
|
||||
new Among ( "at", 0, 1, "", methodObject ),
|
||||
new Among ( "tt", 0, 2, "", methodObject ),
|
||||
new Among ( "iz", 0, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ed", -1, 2, "", this),
|
||||
new Among ( "eed", 0, 1, "", this),
|
||||
new Among ( "ing", -1, 2, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ed", -1, 2, "", methodObject ),
|
||||
new Among ( "eed", 0, 1, "", methodObject ),
|
||||
new Among ( "ing", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "anci", -1, 3, "", this),
|
||||
new Among ( "enci", -1, 2, "", this),
|
||||
new Among ( "abli", -1, 4, "", this),
|
||||
new Among ( "eli", -1, 6, "", this),
|
||||
new Among ( "alli", -1, 9, "", this),
|
||||
new Among ( "ousli", -1, 12, "", this),
|
||||
new Among ( "entli", -1, 5, "", this),
|
||||
new Among ( "aliti", -1, 10, "", this),
|
||||
new Among ( "biliti", -1, 14, "", this),
|
||||
new Among ( "iviti", -1, 13, "", this),
|
||||
new Among ( "tional", -1, 1, "", this),
|
||||
new Among ( "ational", 10, 8, "", this),
|
||||
new Among ( "alism", -1, 10, "", this),
|
||||
new Among ( "ation", -1, 8, "", this),
|
||||
new Among ( "ization", 13, 7, "", this),
|
||||
new Among ( "izer", -1, 7, "", this),
|
||||
new Among ( "ator", -1, 8, "", this),
|
||||
new Among ( "iveness", -1, 13, "", this),
|
||||
new Among ( "fulness", -1, 11, "", this),
|
||||
new Among ( "ousness", -1, 12, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "anci", -1, 3, "", methodObject ),
|
||||
new Among ( "enci", -1, 2, "", methodObject ),
|
||||
new Among ( "abli", -1, 4, "", methodObject ),
|
||||
new Among ( "eli", -1, 6, "", methodObject ),
|
||||
new Among ( "alli", -1, 9, "", methodObject ),
|
||||
new Among ( "ousli", -1, 12, "", methodObject ),
|
||||
new Among ( "entli", -1, 5, "", methodObject ),
|
||||
new Among ( "aliti", -1, 10, "", methodObject ),
|
||||
new Among ( "biliti", -1, 14, "", methodObject ),
|
||||
new Among ( "iviti", -1, 13, "", methodObject ),
|
||||
new Among ( "tional", -1, 1, "", methodObject ),
|
||||
new Among ( "ational", 10, 8, "", methodObject ),
|
||||
new Among ( "alism", -1, 10, "", methodObject ),
|
||||
new Among ( "ation", -1, 8, "", methodObject ),
|
||||
new Among ( "ization", 13, 7, "", methodObject ),
|
||||
new Among ( "izer", -1, 7, "", methodObject ),
|
||||
new Among ( "ator", -1, 8, "", methodObject ),
|
||||
new Among ( "iveness", -1, 13, "", methodObject ),
|
||||
new Among ( "fulness", -1, 11, "", methodObject ),
|
||||
new Among ( "ousness", -1, 12, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "icate", -1, 2, "", this),
|
||||
new Among ( "ative", -1, 3, "", this),
|
||||
new Among ( "alize", -1, 1, "", this),
|
||||
new Among ( "iciti", -1, 2, "", this),
|
||||
new Among ( "ical", -1, 2, "", this),
|
||||
new Among ( "ful", -1, 3, "", this),
|
||||
new Among ( "ness", -1, 3, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "icate", -1, 2, "", methodObject ),
|
||||
new Among ( "ative", -1, 3, "", methodObject ),
|
||||
new Among ( "alize", -1, 1, "", methodObject ),
|
||||
new Among ( "iciti", -1, 2, "", methodObject ),
|
||||
new Among ( "ical", -1, 2, "", methodObject ),
|
||||
new Among ( "ful", -1, 3, "", methodObject ),
|
||||
new Among ( "ness", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "ic", -1, 1, "", this),
|
||||
new Among ( "ance", -1, 1, "", this),
|
||||
new Among ( "ence", -1, 1, "", this),
|
||||
new Among ( "able", -1, 1, "", this),
|
||||
new Among ( "ible", -1, 1, "", this),
|
||||
new Among ( "ate", -1, 1, "", this),
|
||||
new Among ( "ive", -1, 1, "", this),
|
||||
new Among ( "ize", -1, 1, "", this),
|
||||
new Among ( "iti", -1, 1, "", this),
|
||||
new Among ( "al", -1, 1, "", this),
|
||||
new Among ( "ism", -1, 1, "", this),
|
||||
new Among ( "ion", -1, 2, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "ous", -1, 1, "", this),
|
||||
new Among ( "ant", -1, 1, "", this),
|
||||
new Among ( "ent", -1, 1, "", this),
|
||||
new Among ( "ment", 15, 1, "", this),
|
||||
new Among ( "ement", 16, 1, "", this),
|
||||
new Among ( "ou", -1, 1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "ic", -1, 1, "", methodObject ),
|
||||
new Among ( "ance", -1, 1, "", methodObject ),
|
||||
new Among ( "ence", -1, 1, "", methodObject ),
|
||||
new Among ( "able", -1, 1, "", methodObject ),
|
||||
new Among ( "ible", -1, 1, "", methodObject ),
|
||||
new Among ( "ate", -1, 1, "", methodObject ),
|
||||
new Among ( "ive", -1, 1, "", methodObject ),
|
||||
new Among ( "ize", -1, 1, "", methodObject ),
|
||||
new Among ( "iti", -1, 1, "", methodObject ),
|
||||
new Among ( "al", -1, 1, "", methodObject ),
|
||||
new Among ( "ism", -1, 1, "", methodObject ),
|
||||
new Among ( "ion", -1, 2, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "ous", -1, 1, "", methodObject ),
|
||||
new Among ( "ant", -1, 1, "", methodObject ),
|
||||
new Among ( "ent", -1, 1, "", methodObject ),
|
||||
new Among ( "ment", 15, 1, "", methodObject ),
|
||||
new Among ( "ement", 16, 1, "", methodObject ),
|
||||
new Among ( "ou", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1 };
|
||||
|
@ -902,5 +909,15 @@ public class PorterStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof PorterStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return PorterStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,231 +1,238 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class PortugueseStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "\u00E3", 0, 1, "", this),
|
||||
new Among ( "\u00F5", 0, 2, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static PortugueseStemmer methodObject = new PortugueseStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "\u00E3", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00F5", 0, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "a~", 0, 1, "", this),
|
||||
new Among ( "o~", 0, 2, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "a~", 0, 1, "", methodObject ),
|
||||
new Among ( "o~", 0, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ic", -1, -1, "", this),
|
||||
new Among ( "ad", -1, -1, "", this),
|
||||
new Among ( "os", -1, -1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ic", -1, -1, "", methodObject ),
|
||||
new Among ( "ad", -1, -1, "", methodObject ),
|
||||
new Among ( "os", -1, -1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ante", -1, 1, "", this),
|
||||
new Among ( "avel", -1, 1, "", this),
|
||||
new Among ( "\u00EDvel", -1, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ante", -1, 1, "", methodObject ),
|
||||
new Among ( "avel", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EDvel", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ic", -1, 1, "", this),
|
||||
new Among ( "abil", -1, 1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ic", -1, 1, "", methodObject ),
|
||||
new Among ( "abil", -1, 1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "ica", -1, 1, "", this),
|
||||
new Among ( "\u00E2ncia", -1, 1, "", this),
|
||||
new Among ( "\u00EAncia", -1, 4, "", this),
|
||||
new Among ( "ira", -1, 9, "", this),
|
||||
new Among ( "adora", -1, 1, "", this),
|
||||
new Among ( "osa", -1, 1, "", this),
|
||||
new Among ( "ista", -1, 1, "", this),
|
||||
new Among ( "iva", -1, 8, "", this),
|
||||
new Among ( "eza", -1, 1, "", this),
|
||||
new Among ( "log\u00EDa", -1, 2, "", this),
|
||||
new Among ( "idade", -1, 7, "", this),
|
||||
new Among ( "ante", -1, 1, "", this),
|
||||
new Among ( "mente", -1, 6, "", this),
|
||||
new Among ( "amente", 12, 5, "", this),
|
||||
new Among ( "\u00E1vel", -1, 1, "", this),
|
||||
new Among ( "\u00EDvel", -1, 1, "", this),
|
||||
new Among ( "uci\u00F3n", -1, 3, "", this),
|
||||
new Among ( "ico", -1, 1, "", this),
|
||||
new Among ( "ismo", -1, 1, "", this),
|
||||
new Among ( "oso", -1, 1, "", this),
|
||||
new Among ( "amento", -1, 1, "", this),
|
||||
new Among ( "imento", -1, 1, "", this),
|
||||
new Among ( "ivo", -1, 8, "", this),
|
||||
new Among ( "a\u00E7a~o", -1, 1, "", this),
|
||||
new Among ( "ador", -1, 1, "", this),
|
||||
new Among ( "icas", -1, 1, "", this),
|
||||
new Among ( "\u00EAncias", -1, 4, "", this),
|
||||
new Among ( "iras", -1, 9, "", this),
|
||||
new Among ( "adoras", -1, 1, "", this),
|
||||
new Among ( "osas", -1, 1, "", this),
|
||||
new Among ( "istas", -1, 1, "", this),
|
||||
new Among ( "ivas", -1, 8, "", this),
|
||||
new Among ( "ezas", -1, 1, "", this),
|
||||
new Among ( "log\u00EDas", -1, 2, "", this),
|
||||
new Among ( "idades", -1, 7, "", this),
|
||||
new Among ( "uciones", -1, 3, "", this),
|
||||
new Among ( "adores", -1, 1, "", this),
|
||||
new Among ( "antes", -1, 1, "", this),
|
||||
new Among ( "a\u00E7o~es", -1, 1, "", this),
|
||||
new Among ( "icos", -1, 1, "", this),
|
||||
new Among ( "ismos", -1, 1, "", this),
|
||||
new Among ( "osos", -1, 1, "", this),
|
||||
new Among ( "amentos", -1, 1, "", this),
|
||||
new Among ( "imentos", -1, 1, "", this),
|
||||
new Among ( "ivos", -1, 8, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "ica", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2ncia", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EAncia", -1, 4, "", methodObject ),
|
||||
new Among ( "ira", -1, 9, "", methodObject ),
|
||||
new Among ( "adora", -1, 1, "", methodObject ),
|
||||
new Among ( "osa", -1, 1, "", methodObject ),
|
||||
new Among ( "ista", -1, 1, "", methodObject ),
|
||||
new Among ( "iva", -1, 8, "", methodObject ),
|
||||
new Among ( "eza", -1, 1, "", methodObject ),
|
||||
new Among ( "log\u00EDa", -1, 2, "", methodObject ),
|
||||
new Among ( "idade", -1, 7, "", methodObject ),
|
||||
new Among ( "ante", -1, 1, "", methodObject ),
|
||||
new Among ( "mente", -1, 6, "", methodObject ),
|
||||
new Among ( "amente", 12, 5, "", methodObject ),
|
||||
new Among ( "\u00E1vel", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EDvel", -1, 1, "", methodObject ),
|
||||
new Among ( "uci\u00F3n", -1, 3, "", methodObject ),
|
||||
new Among ( "ico", -1, 1, "", methodObject ),
|
||||
new Among ( "ismo", -1, 1, "", methodObject ),
|
||||
new Among ( "oso", -1, 1, "", methodObject ),
|
||||
new Among ( "amento", -1, 1, "", methodObject ),
|
||||
new Among ( "imento", -1, 1, "", methodObject ),
|
||||
new Among ( "ivo", -1, 8, "", methodObject ),
|
||||
new Among ( "a\u00E7a~o", -1, 1, "", methodObject ),
|
||||
new Among ( "ador", -1, 1, "", methodObject ),
|
||||
new Among ( "icas", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EAncias", -1, 4, "", methodObject ),
|
||||
new Among ( "iras", -1, 9, "", methodObject ),
|
||||
new Among ( "adoras", -1, 1, "", methodObject ),
|
||||
new Among ( "osas", -1, 1, "", methodObject ),
|
||||
new Among ( "istas", -1, 1, "", methodObject ),
|
||||
new Among ( "ivas", -1, 8, "", methodObject ),
|
||||
new Among ( "ezas", -1, 1, "", methodObject ),
|
||||
new Among ( "log\u00EDas", -1, 2, "", methodObject ),
|
||||
new Among ( "idades", -1, 7, "", methodObject ),
|
||||
new Among ( "uciones", -1, 3, "", methodObject ),
|
||||
new Among ( "adores", -1, 1, "", methodObject ),
|
||||
new Among ( "antes", -1, 1, "", methodObject ),
|
||||
new Among ( "a\u00E7o~es", -1, 1, "", methodObject ),
|
||||
new Among ( "icos", -1, 1, "", methodObject ),
|
||||
new Among ( "ismos", -1, 1, "", methodObject ),
|
||||
new Among ( "osos", -1, 1, "", methodObject ),
|
||||
new Among ( "amentos", -1, 1, "", methodObject ),
|
||||
new Among ( "imentos", -1, 1, "", methodObject ),
|
||||
new Among ( "ivos", -1, 8, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "ada", -1, 1, "", this),
|
||||
new Among ( "ida", -1, 1, "", this),
|
||||
new Among ( "ia", -1, 1, "", this),
|
||||
new Among ( "aria", 2, 1, "", this),
|
||||
new Among ( "eria", 2, 1, "", this),
|
||||
new Among ( "iria", 2, 1, "", this),
|
||||
new Among ( "ara", -1, 1, "", this),
|
||||
new Among ( "era", -1, 1, "", this),
|
||||
new Among ( "ira", -1, 1, "", this),
|
||||
new Among ( "ava", -1, 1, "", this),
|
||||
new Among ( "asse", -1, 1, "", this),
|
||||
new Among ( "esse", -1, 1, "", this),
|
||||
new Among ( "isse", -1, 1, "", this),
|
||||
new Among ( "aste", -1, 1, "", this),
|
||||
new Among ( "este", -1, 1, "", this),
|
||||
new Among ( "iste", -1, 1, "", this),
|
||||
new Among ( "ei", -1, 1, "", this),
|
||||
new Among ( "arei", 16, 1, "", this),
|
||||
new Among ( "erei", 16, 1, "", this),
|
||||
new Among ( "irei", 16, 1, "", this),
|
||||
new Among ( "am", -1, 1, "", this),
|
||||
new Among ( "iam", 20, 1, "", this),
|
||||
new Among ( "ariam", 21, 1, "", this),
|
||||
new Among ( "eriam", 21, 1, "", this),
|
||||
new Among ( "iriam", 21, 1, "", this),
|
||||
new Among ( "aram", 20, 1, "", this),
|
||||
new Among ( "eram", 20, 1, "", this),
|
||||
new Among ( "iram", 20, 1, "", this),
|
||||
new Among ( "avam", 20, 1, "", this),
|
||||
new Among ( "em", -1, 1, "", this),
|
||||
new Among ( "arem", 29, 1, "", this),
|
||||
new Among ( "erem", 29, 1, "", this),
|
||||
new Among ( "irem", 29, 1, "", this),
|
||||
new Among ( "assem", 29, 1, "", this),
|
||||
new Among ( "essem", 29, 1, "", this),
|
||||
new Among ( "issem", 29, 1, "", this),
|
||||
new Among ( "ado", -1, 1, "", this),
|
||||
new Among ( "ido", -1, 1, "", this),
|
||||
new Among ( "ando", -1, 1, "", this),
|
||||
new Among ( "endo", -1, 1, "", this),
|
||||
new Among ( "indo", -1, 1, "", this),
|
||||
new Among ( "ara~o", -1, 1, "", this),
|
||||
new Among ( "era~o", -1, 1, "", this),
|
||||
new Among ( "ira~o", -1, 1, "", this),
|
||||
new Among ( "ar", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "ir", -1, 1, "", this),
|
||||
new Among ( "as", -1, 1, "", this),
|
||||
new Among ( "adas", 47, 1, "", this),
|
||||
new Among ( "idas", 47, 1, "", this),
|
||||
new Among ( "ias", 47, 1, "", this),
|
||||
new Among ( "arias", 50, 1, "", this),
|
||||
new Among ( "erias", 50, 1, "", this),
|
||||
new Among ( "irias", 50, 1, "", this),
|
||||
new Among ( "aras", 47, 1, "", this),
|
||||
new Among ( "eras", 47, 1, "", this),
|
||||
new Among ( "iras", 47, 1, "", this),
|
||||
new Among ( "avas", 47, 1, "", this),
|
||||
new Among ( "es", -1, 1, "", this),
|
||||
new Among ( "ardes", 58, 1, "", this),
|
||||
new Among ( "erdes", 58, 1, "", this),
|
||||
new Among ( "irdes", 58, 1, "", this),
|
||||
new Among ( "ares", 58, 1, "", this),
|
||||
new Among ( "eres", 58, 1, "", this),
|
||||
new Among ( "ires", 58, 1, "", this),
|
||||
new Among ( "asses", 58, 1, "", this),
|
||||
new Among ( "esses", 58, 1, "", this),
|
||||
new Among ( "isses", 58, 1, "", this),
|
||||
new Among ( "astes", 58, 1, "", this),
|
||||
new Among ( "estes", 58, 1, "", this),
|
||||
new Among ( "istes", 58, 1, "", this),
|
||||
new Among ( "is", -1, 1, "", this),
|
||||
new Among ( "ais", 71, 1, "", this),
|
||||
new Among ( "eis", 71, 1, "", this),
|
||||
new Among ( "areis", 73, 1, "", this),
|
||||
new Among ( "ereis", 73, 1, "", this),
|
||||
new Among ( "ireis", 73, 1, "", this),
|
||||
new Among ( "\u00E1reis", 73, 1, "", this),
|
||||
new Among ( "\u00E9reis", 73, 1, "", this),
|
||||
new Among ( "\u00EDreis", 73, 1, "", this),
|
||||
new Among ( "\u00E1sseis", 73, 1, "", this),
|
||||
new Among ( "\u00E9sseis", 73, 1, "", this),
|
||||
new Among ( "\u00EDsseis", 73, 1, "", this),
|
||||
new Among ( "\u00E1veis", 73, 1, "", this),
|
||||
new Among ( "\u00EDeis", 73, 1, "", this),
|
||||
new Among ( "ar\u00EDeis", 84, 1, "", this),
|
||||
new Among ( "er\u00EDeis", 84, 1, "", this),
|
||||
new Among ( "ir\u00EDeis", 84, 1, "", this),
|
||||
new Among ( "ados", -1, 1, "", this),
|
||||
new Among ( "idos", -1, 1, "", this),
|
||||
new Among ( "amos", -1, 1, "", this),
|
||||
new Among ( "\u00E1ramos", 90, 1, "", this),
|
||||
new Among ( "\u00E9ramos", 90, 1, "", this),
|
||||
new Among ( "\u00EDramos", 90, 1, "", this),
|
||||
new Among ( "\u00E1vamos", 90, 1, "", this),
|
||||
new Among ( "\u00EDamos", 90, 1, "", this),
|
||||
new Among ( "ar\u00EDamos", 95, 1, "", this),
|
||||
new Among ( "er\u00EDamos", 95, 1, "", this),
|
||||
new Among ( "ir\u00EDamos", 95, 1, "", this),
|
||||
new Among ( "emos", -1, 1, "", this),
|
||||
new Among ( "aremos", 99, 1, "", this),
|
||||
new Among ( "eremos", 99, 1, "", this),
|
||||
new Among ( "iremos", 99, 1, "", this),
|
||||
new Among ( "\u00E1ssemos", 99, 1, "", this),
|
||||
new Among ( "\u00EAssemos", 99, 1, "", this),
|
||||
new Among ( "\u00EDssemos", 99, 1, "", this),
|
||||
new Among ( "imos", -1, 1, "", this),
|
||||
new Among ( "armos", -1, 1, "", this),
|
||||
new Among ( "ermos", -1, 1, "", this),
|
||||
new Among ( "irmos", -1, 1, "", this),
|
||||
new Among ( "\u00E1mos", -1, 1, "", this),
|
||||
new Among ( "ar\u00E1s", -1, 1, "", this),
|
||||
new Among ( "er\u00E1s", -1, 1, "", this),
|
||||
new Among ( "ir\u00E1s", -1, 1, "", this),
|
||||
new Among ( "eu", -1, 1, "", this),
|
||||
new Among ( "iu", -1, 1, "", this),
|
||||
new Among ( "ou", -1, 1, "", this),
|
||||
new Among ( "ar\u00E1", -1, 1, "", this),
|
||||
new Among ( "er\u00E1", -1, 1, "", this),
|
||||
new Among ( "ir\u00E1", -1, 1, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "ada", -1, 1, "", methodObject ),
|
||||
new Among ( "ida", -1, 1, "", methodObject ),
|
||||
new Among ( "ia", -1, 1, "", methodObject ),
|
||||
new Among ( "aria", 2, 1, "", methodObject ),
|
||||
new Among ( "eria", 2, 1, "", methodObject ),
|
||||
new Among ( "iria", 2, 1, "", methodObject ),
|
||||
new Among ( "ara", -1, 1, "", methodObject ),
|
||||
new Among ( "era", -1, 1, "", methodObject ),
|
||||
new Among ( "ira", -1, 1, "", methodObject ),
|
||||
new Among ( "ava", -1, 1, "", methodObject ),
|
||||
new Among ( "asse", -1, 1, "", methodObject ),
|
||||
new Among ( "esse", -1, 1, "", methodObject ),
|
||||
new Among ( "isse", -1, 1, "", methodObject ),
|
||||
new Among ( "aste", -1, 1, "", methodObject ),
|
||||
new Among ( "este", -1, 1, "", methodObject ),
|
||||
new Among ( "iste", -1, 1, "", methodObject ),
|
||||
new Among ( "ei", -1, 1, "", methodObject ),
|
||||
new Among ( "arei", 16, 1, "", methodObject ),
|
||||
new Among ( "erei", 16, 1, "", methodObject ),
|
||||
new Among ( "irei", 16, 1, "", methodObject ),
|
||||
new Among ( "am", -1, 1, "", methodObject ),
|
||||
new Among ( "iam", 20, 1, "", methodObject ),
|
||||
new Among ( "ariam", 21, 1, "", methodObject ),
|
||||
new Among ( "eriam", 21, 1, "", methodObject ),
|
||||
new Among ( "iriam", 21, 1, "", methodObject ),
|
||||
new Among ( "aram", 20, 1, "", methodObject ),
|
||||
new Among ( "eram", 20, 1, "", methodObject ),
|
||||
new Among ( "iram", 20, 1, "", methodObject ),
|
||||
new Among ( "avam", 20, 1, "", methodObject ),
|
||||
new Among ( "em", -1, 1, "", methodObject ),
|
||||
new Among ( "arem", 29, 1, "", methodObject ),
|
||||
new Among ( "erem", 29, 1, "", methodObject ),
|
||||
new Among ( "irem", 29, 1, "", methodObject ),
|
||||
new Among ( "assem", 29, 1, "", methodObject ),
|
||||
new Among ( "essem", 29, 1, "", methodObject ),
|
||||
new Among ( "issem", 29, 1, "", methodObject ),
|
||||
new Among ( "ado", -1, 1, "", methodObject ),
|
||||
new Among ( "ido", -1, 1, "", methodObject ),
|
||||
new Among ( "ando", -1, 1, "", methodObject ),
|
||||
new Among ( "endo", -1, 1, "", methodObject ),
|
||||
new Among ( "indo", -1, 1, "", methodObject ),
|
||||
new Among ( "ara~o", -1, 1, "", methodObject ),
|
||||
new Among ( "era~o", -1, 1, "", methodObject ),
|
||||
new Among ( "ira~o", -1, 1, "", methodObject ),
|
||||
new Among ( "ar", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "ir", -1, 1, "", methodObject ),
|
||||
new Among ( "as", -1, 1, "", methodObject ),
|
||||
new Among ( "adas", 47, 1, "", methodObject ),
|
||||
new Among ( "idas", 47, 1, "", methodObject ),
|
||||
new Among ( "ias", 47, 1, "", methodObject ),
|
||||
new Among ( "arias", 50, 1, "", methodObject ),
|
||||
new Among ( "erias", 50, 1, "", methodObject ),
|
||||
new Among ( "irias", 50, 1, "", methodObject ),
|
||||
new Among ( "aras", 47, 1, "", methodObject ),
|
||||
new Among ( "eras", 47, 1, "", methodObject ),
|
||||
new Among ( "iras", 47, 1, "", methodObject ),
|
||||
new Among ( "avas", 47, 1, "", methodObject ),
|
||||
new Among ( "es", -1, 1, "", methodObject ),
|
||||
new Among ( "ardes", 58, 1, "", methodObject ),
|
||||
new Among ( "erdes", 58, 1, "", methodObject ),
|
||||
new Among ( "irdes", 58, 1, "", methodObject ),
|
||||
new Among ( "ares", 58, 1, "", methodObject ),
|
||||
new Among ( "eres", 58, 1, "", methodObject ),
|
||||
new Among ( "ires", 58, 1, "", methodObject ),
|
||||
new Among ( "asses", 58, 1, "", methodObject ),
|
||||
new Among ( "esses", 58, 1, "", methodObject ),
|
||||
new Among ( "isses", 58, 1, "", methodObject ),
|
||||
new Among ( "astes", 58, 1, "", methodObject ),
|
||||
new Among ( "estes", 58, 1, "", methodObject ),
|
||||
new Among ( "istes", 58, 1, "", methodObject ),
|
||||
new Among ( "is", -1, 1, "", methodObject ),
|
||||
new Among ( "ais", 71, 1, "", methodObject ),
|
||||
new Among ( "eis", 71, 1, "", methodObject ),
|
||||
new Among ( "areis", 73, 1, "", methodObject ),
|
||||
new Among ( "ereis", 73, 1, "", methodObject ),
|
||||
new Among ( "ireis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00E1reis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00E9reis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00EDreis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00E1sseis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00E9sseis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00EDsseis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00E1veis", 73, 1, "", methodObject ),
|
||||
new Among ( "\u00EDeis", 73, 1, "", methodObject ),
|
||||
new Among ( "ar\u00EDeis", 84, 1, "", methodObject ),
|
||||
new Among ( "er\u00EDeis", 84, 1, "", methodObject ),
|
||||
new Among ( "ir\u00EDeis", 84, 1, "", methodObject ),
|
||||
new Among ( "ados", -1, 1, "", methodObject ),
|
||||
new Among ( "idos", -1, 1, "", methodObject ),
|
||||
new Among ( "amos", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E1ramos", 90, 1, "", methodObject ),
|
||||
new Among ( "\u00E9ramos", 90, 1, "", methodObject ),
|
||||
new Among ( "\u00EDramos", 90, 1, "", methodObject ),
|
||||
new Among ( "\u00E1vamos", 90, 1, "", methodObject ),
|
||||
new Among ( "\u00EDamos", 90, 1, "", methodObject ),
|
||||
new Among ( "ar\u00EDamos", 95, 1, "", methodObject ),
|
||||
new Among ( "er\u00EDamos", 95, 1, "", methodObject ),
|
||||
new Among ( "ir\u00EDamos", 95, 1, "", methodObject ),
|
||||
new Among ( "emos", -1, 1, "", methodObject ),
|
||||
new Among ( "aremos", 99, 1, "", methodObject ),
|
||||
new Among ( "eremos", 99, 1, "", methodObject ),
|
||||
new Among ( "iremos", 99, 1, "", methodObject ),
|
||||
new Among ( "\u00E1ssemos", 99, 1, "", methodObject ),
|
||||
new Among ( "\u00EAssemos", 99, 1, "", methodObject ),
|
||||
new Among ( "\u00EDssemos", 99, 1, "", methodObject ),
|
||||
new Among ( "imos", -1, 1, "", methodObject ),
|
||||
new Among ( "armos", -1, 1, "", methodObject ),
|
||||
new Among ( "ermos", -1, 1, "", methodObject ),
|
||||
new Among ( "irmos", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E1mos", -1, 1, "", methodObject ),
|
||||
new Among ( "ar\u00E1s", -1, 1, "", methodObject ),
|
||||
new Among ( "er\u00E1s", -1, 1, "", methodObject ),
|
||||
new Among ( "ir\u00E1s", -1, 1, "", methodObject ),
|
||||
new Among ( "eu", -1, 1, "", methodObject ),
|
||||
new Among ( "iu", -1, 1, "", methodObject ),
|
||||
new Among ( "ou", -1, 1, "", methodObject ),
|
||||
new Among ( "ar\u00E1", -1, 1, "", methodObject ),
|
||||
new Among ( "er\u00E1", -1, 1, "", methodObject ),
|
||||
new Among ( "ir\u00E1", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "a", -1, 1, "", this),
|
||||
new Among ( "i", -1, 1, "", this),
|
||||
new Among ( "o", -1, 1, "", this),
|
||||
new Among ( "os", -1, 1, "", this),
|
||||
new Among ( "\u00E1", -1, 1, "", this),
|
||||
new Among ( "\u00ED", -1, 1, "", this),
|
||||
new Among ( "\u00F3", -1, 1, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "a", -1, 1, "", methodObject ),
|
||||
new Among ( "i", -1, 1, "", methodObject ),
|
||||
new Among ( "o", -1, 1, "", methodObject ),
|
||||
new Among ( "os", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E1", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00ED", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00F3", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "\u00E7", -1, 2, "", this),
|
||||
new Among ( "\u00E9", -1, 1, "", this),
|
||||
new Among ( "\u00EA", -1, 1, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E7", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00EA", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 3, 19, 12, 2 };
|
||||
|
@ -1112,5 +1119,15 @@ public class PortugueseStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof PortugueseStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return PortugueseStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,256 +1,263 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class RomanianStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 3, "", this),
|
||||
new Among ( "I", 0, 1, "", this),
|
||||
new Among ( "U", 0, 2, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static RomanianStemmer methodObject = new RomanianStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 3, "", methodObject ),
|
||||
new Among ( "I", 0, 1, "", methodObject ),
|
||||
new Among ( "U", 0, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "ea", -1, 3, "", this),
|
||||
new Among ( "a\u0163ia", -1, 7, "", this),
|
||||
new Among ( "aua", -1, 2, "", this),
|
||||
new Among ( "iua", -1, 4, "", this),
|
||||
new Among ( "a\u0163ie", -1, 7, "", this),
|
||||
new Among ( "ele", -1, 3, "", this),
|
||||
new Among ( "ile", -1, 5, "", this),
|
||||
new Among ( "iile", 6, 4, "", this),
|
||||
new Among ( "iei", -1, 4, "", this),
|
||||
new Among ( "atei", -1, 6, "", this),
|
||||
new Among ( "ii", -1, 4, "", this),
|
||||
new Among ( "ului", -1, 1, "", this),
|
||||
new Among ( "ul", -1, 1, "", this),
|
||||
new Among ( "elor", -1, 3, "", this),
|
||||
new Among ( "ilor", -1, 4, "", this),
|
||||
new Among ( "iilor", 14, 4, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "ea", -1, 3, "", methodObject ),
|
||||
new Among ( "a\u0163ia", -1, 7, "", methodObject ),
|
||||
new Among ( "aua", -1, 2, "", methodObject ),
|
||||
new Among ( "iua", -1, 4, "", methodObject ),
|
||||
new Among ( "a\u0163ie", -1, 7, "", methodObject ),
|
||||
new Among ( "ele", -1, 3, "", methodObject ),
|
||||
new Among ( "ile", -1, 5, "", methodObject ),
|
||||
new Among ( "iile", 6, 4, "", methodObject ),
|
||||
new Among ( "iei", -1, 4, "", methodObject ),
|
||||
new Among ( "atei", -1, 6, "", methodObject ),
|
||||
new Among ( "ii", -1, 4, "", methodObject ),
|
||||
new Among ( "ului", -1, 1, "", methodObject ),
|
||||
new Among ( "ul", -1, 1, "", methodObject ),
|
||||
new Among ( "elor", -1, 3, "", methodObject ),
|
||||
new Among ( "ilor", -1, 4, "", methodObject ),
|
||||
new Among ( "iilor", 14, 4, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "icala", -1, 4, "", this),
|
||||
new Among ( "iciva", -1, 4, "", this),
|
||||
new Among ( "ativa", -1, 5, "", this),
|
||||
new Among ( "itiva", -1, 6, "", this),
|
||||
new Among ( "icale", -1, 4, "", this),
|
||||
new Among ( "a\u0163iune", -1, 5, "", this),
|
||||
new Among ( "i\u0163iune", -1, 6, "", this),
|
||||
new Among ( "atoare", -1, 5, "", this),
|
||||
new Among ( "itoare", -1, 6, "", this),
|
||||
new Among ( "\u0103toare", -1, 5, "", this),
|
||||
new Among ( "icitate", -1, 4, "", this),
|
||||
new Among ( "abilitate", -1, 1, "", this),
|
||||
new Among ( "ibilitate", -1, 2, "", this),
|
||||
new Among ( "ivitate", -1, 3, "", this),
|
||||
new Among ( "icive", -1, 4, "", this),
|
||||
new Among ( "ative", -1, 5, "", this),
|
||||
new Among ( "itive", -1, 6, "", this),
|
||||
new Among ( "icali", -1, 4, "", this),
|
||||
new Among ( "atori", -1, 5, "", this),
|
||||
new Among ( "icatori", 18, 4, "", this),
|
||||
new Among ( "itori", -1, 6, "", this),
|
||||
new Among ( "\u0103tori", -1, 5, "", this),
|
||||
new Among ( "icitati", -1, 4, "", this),
|
||||
new Among ( "abilitati", -1, 1, "", this),
|
||||
new Among ( "ivitati", -1, 3, "", this),
|
||||
new Among ( "icivi", -1, 4, "", this),
|
||||
new Among ( "ativi", -1, 5, "", this),
|
||||
new Among ( "itivi", -1, 6, "", this),
|
||||
new Among ( "icit\u0103i", -1, 4, "", this),
|
||||
new Among ( "abilit\u0103i", -1, 1, "", this),
|
||||
new Among ( "ivit\u0103i", -1, 3, "", this),
|
||||
new Among ( "icit\u0103\u0163i", -1, 4, "", this),
|
||||
new Among ( "abilit\u0103\u0163i", -1, 1, "", this),
|
||||
new Among ( "ivit\u0103\u0163i", -1, 3, "", this),
|
||||
new Among ( "ical", -1, 4, "", this),
|
||||
new Among ( "ator", -1, 5, "", this),
|
||||
new Among ( "icator", 35, 4, "", this),
|
||||
new Among ( "itor", -1, 6, "", this),
|
||||
new Among ( "\u0103tor", -1, 5, "", this),
|
||||
new Among ( "iciv", -1, 4, "", this),
|
||||
new Among ( "ativ", -1, 5, "", this),
|
||||
new Among ( "itiv", -1, 6, "", this),
|
||||
new Among ( "ical\u0103", -1, 4, "", this),
|
||||
new Among ( "iciv\u0103", -1, 4, "", this),
|
||||
new Among ( "ativ\u0103", -1, 5, "", this),
|
||||
new Among ( "itiv\u0103", -1, 6, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "icala", -1, 4, "", methodObject ),
|
||||
new Among ( "iciva", -1, 4, "", methodObject ),
|
||||
new Among ( "ativa", -1, 5, "", methodObject ),
|
||||
new Among ( "itiva", -1, 6, "", methodObject ),
|
||||
new Among ( "icale", -1, 4, "", methodObject ),
|
||||
new Among ( "a\u0163iune", -1, 5, "", methodObject ),
|
||||
new Among ( "i\u0163iune", -1, 6, "", methodObject ),
|
||||
new Among ( "atoare", -1, 5, "", methodObject ),
|
||||
new Among ( "itoare", -1, 6, "", methodObject ),
|
||||
new Among ( "\u0103toare", -1, 5, "", methodObject ),
|
||||
new Among ( "icitate", -1, 4, "", methodObject ),
|
||||
new Among ( "abilitate", -1, 1, "", methodObject ),
|
||||
new Among ( "ibilitate", -1, 2, "", methodObject ),
|
||||
new Among ( "ivitate", -1, 3, "", methodObject ),
|
||||
new Among ( "icive", -1, 4, "", methodObject ),
|
||||
new Among ( "ative", -1, 5, "", methodObject ),
|
||||
new Among ( "itive", -1, 6, "", methodObject ),
|
||||
new Among ( "icali", -1, 4, "", methodObject ),
|
||||
new Among ( "atori", -1, 5, "", methodObject ),
|
||||
new Among ( "icatori", 18, 4, "", methodObject ),
|
||||
new Among ( "itori", -1, 6, "", methodObject ),
|
||||
new Among ( "\u0103tori", -1, 5, "", methodObject ),
|
||||
new Among ( "icitati", -1, 4, "", methodObject ),
|
||||
new Among ( "abilitati", -1, 1, "", methodObject ),
|
||||
new Among ( "ivitati", -1, 3, "", methodObject ),
|
||||
new Among ( "icivi", -1, 4, "", methodObject ),
|
||||
new Among ( "ativi", -1, 5, "", methodObject ),
|
||||
new Among ( "itivi", -1, 6, "", methodObject ),
|
||||
new Among ( "icit\u0103i", -1, 4, "", methodObject ),
|
||||
new Among ( "abilit\u0103i", -1, 1, "", methodObject ),
|
||||
new Among ( "ivit\u0103i", -1, 3, "", methodObject ),
|
||||
new Among ( "icit\u0103\u0163i", -1, 4, "", methodObject ),
|
||||
new Among ( "abilit\u0103\u0163i", -1, 1, "", methodObject ),
|
||||
new Among ( "ivit\u0103\u0163i", -1, 3, "", methodObject ),
|
||||
new Among ( "ical", -1, 4, "", methodObject ),
|
||||
new Among ( "ator", -1, 5, "", methodObject ),
|
||||
new Among ( "icator", 35, 4, "", methodObject ),
|
||||
new Among ( "itor", -1, 6, "", methodObject ),
|
||||
new Among ( "\u0103tor", -1, 5, "", methodObject ),
|
||||
new Among ( "iciv", -1, 4, "", methodObject ),
|
||||
new Among ( "ativ", -1, 5, "", methodObject ),
|
||||
new Among ( "itiv", -1, 6, "", methodObject ),
|
||||
new Among ( "ical\u0103", -1, 4, "", methodObject ),
|
||||
new Among ( "iciv\u0103", -1, 4, "", methodObject ),
|
||||
new Among ( "ativ\u0103", -1, 5, "", methodObject ),
|
||||
new Among ( "itiv\u0103", -1, 6, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ica", -1, 1, "", this),
|
||||
new Among ( "abila", -1, 1, "", this),
|
||||
new Among ( "ibila", -1, 1, "", this),
|
||||
new Among ( "oasa", -1, 1, "", this),
|
||||
new Among ( "ata", -1, 1, "", this),
|
||||
new Among ( "ita", -1, 1, "", this),
|
||||
new Among ( "anta", -1, 1, "", this),
|
||||
new Among ( "ista", -1, 3, "", this),
|
||||
new Among ( "uta", -1, 1, "", this),
|
||||
new Among ( "iva", -1, 1, "", this),
|
||||
new Among ( "ic", -1, 1, "", this),
|
||||
new Among ( "ice", -1, 1, "", this),
|
||||
new Among ( "abile", -1, 1, "", this),
|
||||
new Among ( "ibile", -1, 1, "", this),
|
||||
new Among ( "isme", -1, 3, "", this),
|
||||
new Among ( "iune", -1, 2, "", this),
|
||||
new Among ( "oase", -1, 1, "", this),
|
||||
new Among ( "ate", -1, 1, "", this),
|
||||
new Among ( "itate", 17, 1, "", this),
|
||||
new Among ( "ite", -1, 1, "", this),
|
||||
new Among ( "ante", -1, 1, "", this),
|
||||
new Among ( "iste", -1, 3, "", this),
|
||||
new Among ( "ute", -1, 1, "", this),
|
||||
new Among ( "ive", -1, 1, "", this),
|
||||
new Among ( "ici", -1, 1, "", this),
|
||||
new Among ( "abili", -1, 1, "", this),
|
||||
new Among ( "ibili", -1, 1, "", this),
|
||||
new Among ( "iuni", -1, 2, "", this),
|
||||
new Among ( "atori", -1, 1, "", this),
|
||||
new Among ( "osi", -1, 1, "", this),
|
||||
new Among ( "ati", -1, 1, "", this),
|
||||
new Among ( "itati", 30, 1, "", this),
|
||||
new Among ( "iti", -1, 1, "", this),
|
||||
new Among ( "anti", -1, 1, "", this),
|
||||
new Among ( "isti", -1, 3, "", this),
|
||||
new Among ( "uti", -1, 1, "", this),
|
||||
new Among ( "i\u015Fti", -1, 3, "", this),
|
||||
new Among ( "ivi", -1, 1, "", this),
|
||||
new Among ( "it\u0103i", -1, 1, "", this),
|
||||
new Among ( "o\u015Fi", -1, 1, "", this),
|
||||
new Among ( "it\u0103\u0163i", -1, 1, "", this),
|
||||
new Among ( "abil", -1, 1, "", this),
|
||||
new Among ( "ibil", -1, 1, "", this),
|
||||
new Among ( "ism", -1, 3, "", this),
|
||||
new Among ( "ator", -1, 1, "", this),
|
||||
new Among ( "os", -1, 1, "", this),
|
||||
new Among ( "at", -1, 1, "", this),
|
||||
new Among ( "it", -1, 1, "", this),
|
||||
new Among ( "ant", -1, 1, "", this),
|
||||
new Among ( "ist", -1, 3, "", this),
|
||||
new Among ( "ut", -1, 1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this),
|
||||
new Among ( "ic\u0103", -1, 1, "", this),
|
||||
new Among ( "abil\u0103", -1, 1, "", this),
|
||||
new Among ( "ibil\u0103", -1, 1, "", this),
|
||||
new Among ( "oas\u0103", -1, 1, "", this),
|
||||
new Among ( "at\u0103", -1, 1, "", this),
|
||||
new Among ( "it\u0103", -1, 1, "", this),
|
||||
new Among ( "ant\u0103", -1, 1, "", this),
|
||||
new Among ( "ist\u0103", -1, 3, "", this),
|
||||
new Among ( "ut\u0103", -1, 1, "", this),
|
||||
new Among ( "iv\u0103", -1, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ica", -1, 1, "", methodObject ),
|
||||
new Among ( "abila", -1, 1, "", methodObject ),
|
||||
new Among ( "ibila", -1, 1, "", methodObject ),
|
||||
new Among ( "oasa", -1, 1, "", methodObject ),
|
||||
new Among ( "ata", -1, 1, "", methodObject ),
|
||||
new Among ( "ita", -1, 1, "", methodObject ),
|
||||
new Among ( "anta", -1, 1, "", methodObject ),
|
||||
new Among ( "ista", -1, 3, "", methodObject ),
|
||||
new Among ( "uta", -1, 1, "", methodObject ),
|
||||
new Among ( "iva", -1, 1, "", methodObject ),
|
||||
new Among ( "ic", -1, 1, "", methodObject ),
|
||||
new Among ( "ice", -1, 1, "", methodObject ),
|
||||
new Among ( "abile", -1, 1, "", methodObject ),
|
||||
new Among ( "ibile", -1, 1, "", methodObject ),
|
||||
new Among ( "isme", -1, 3, "", methodObject ),
|
||||
new Among ( "iune", -1, 2, "", methodObject ),
|
||||
new Among ( "oase", -1, 1, "", methodObject ),
|
||||
new Among ( "ate", -1, 1, "", methodObject ),
|
||||
new Among ( "itate", 17, 1, "", methodObject ),
|
||||
new Among ( "ite", -1, 1, "", methodObject ),
|
||||
new Among ( "ante", -1, 1, "", methodObject ),
|
||||
new Among ( "iste", -1, 3, "", methodObject ),
|
||||
new Among ( "ute", -1, 1, "", methodObject ),
|
||||
new Among ( "ive", -1, 1, "", methodObject ),
|
||||
new Among ( "ici", -1, 1, "", methodObject ),
|
||||
new Among ( "abili", -1, 1, "", methodObject ),
|
||||
new Among ( "ibili", -1, 1, "", methodObject ),
|
||||
new Among ( "iuni", -1, 2, "", methodObject ),
|
||||
new Among ( "atori", -1, 1, "", methodObject ),
|
||||
new Among ( "osi", -1, 1, "", methodObject ),
|
||||
new Among ( "ati", -1, 1, "", methodObject ),
|
||||
new Among ( "itati", 30, 1, "", methodObject ),
|
||||
new Among ( "iti", -1, 1, "", methodObject ),
|
||||
new Among ( "anti", -1, 1, "", methodObject ),
|
||||
new Among ( "isti", -1, 3, "", methodObject ),
|
||||
new Among ( "uti", -1, 1, "", methodObject ),
|
||||
new Among ( "i\u015Fti", -1, 3, "", methodObject ),
|
||||
new Among ( "ivi", -1, 1, "", methodObject ),
|
||||
new Among ( "it\u0103i", -1, 1, "", methodObject ),
|
||||
new Among ( "o\u015Fi", -1, 1, "", methodObject ),
|
||||
new Among ( "it\u0103\u0163i", -1, 1, "", methodObject ),
|
||||
new Among ( "abil", -1, 1, "", methodObject ),
|
||||
new Among ( "ibil", -1, 1, "", methodObject ),
|
||||
new Among ( "ism", -1, 3, "", methodObject ),
|
||||
new Among ( "ator", -1, 1, "", methodObject ),
|
||||
new Among ( "os", -1, 1, "", methodObject ),
|
||||
new Among ( "at", -1, 1, "", methodObject ),
|
||||
new Among ( "it", -1, 1, "", methodObject ),
|
||||
new Among ( "ant", -1, 1, "", methodObject ),
|
||||
new Among ( "ist", -1, 3, "", methodObject ),
|
||||
new Among ( "ut", -1, 1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject ),
|
||||
new Among ( "ic\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "abil\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "ibil\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "oas\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "at\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "it\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "ant\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "ist\u0103", -1, 3, "", methodObject ),
|
||||
new Among ( "ut\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "iv\u0103", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "ea", -1, 1, "", this),
|
||||
new Among ( "ia", -1, 1, "", this),
|
||||
new Among ( "esc", -1, 1, "", this),
|
||||
new Among ( "\u0103sc", -1, 1, "", this),
|
||||
new Among ( "ind", -1, 1, "", this),
|
||||
new Among ( "\u00E2nd", -1, 1, "", this),
|
||||
new Among ( "are", -1, 1, "", this),
|
||||
new Among ( "ere", -1, 1, "", this),
|
||||
new Among ( "ire", -1, 1, "", this),
|
||||
new Among ( "\u00E2re", -1, 1, "", this),
|
||||
new Among ( "se", -1, 2, "", this),
|
||||
new Among ( "ase", 10, 1, "", this),
|
||||
new Among ( "sese", 10, 2, "", this),
|
||||
new Among ( "ise", 10, 1, "", this),
|
||||
new Among ( "use", 10, 1, "", this),
|
||||
new Among ( "\u00E2se", 10, 1, "", this),
|
||||
new Among ( "e\u015Fte", -1, 1, "", this),
|
||||
new Among ( "\u0103\u015Fte", -1, 1, "", this),
|
||||
new Among ( "eze", -1, 1, "", this),
|
||||
new Among ( "ai", -1, 1, "", this),
|
||||
new Among ( "eai", 19, 1, "", this),
|
||||
new Among ( "iai", 19, 1, "", this),
|
||||
new Among ( "sei", -1, 2, "", this),
|
||||
new Among ( "e\u015Fti", -1, 1, "", this),
|
||||
new Among ( "\u0103\u015Fti", -1, 1, "", this),
|
||||
new Among ( "ui", -1, 1, "", this),
|
||||
new Among ( "ezi", -1, 1, "", this),
|
||||
new Among ( "\u00E2i", -1, 1, "", this),
|
||||
new Among ( "a\u015Fi", -1, 1, "", this),
|
||||
new Among ( "se\u015Fi", -1, 2, "", this),
|
||||
new Among ( "ase\u015Fi", 29, 1, "", this),
|
||||
new Among ( "sese\u015Fi", 29, 2, "", this),
|
||||
new Among ( "ise\u015Fi", 29, 1, "", this),
|
||||
new Among ( "use\u015Fi", 29, 1, "", this),
|
||||
new Among ( "\u00E2se\u015Fi", 29, 1, "", this),
|
||||
new Among ( "i\u015Fi", -1, 1, "", this),
|
||||
new Among ( "u\u015Fi", -1, 1, "", this),
|
||||
new Among ( "\u00E2\u015Fi", -1, 1, "", this),
|
||||
new Among ( "a\u0163i", -1, 2, "", this),
|
||||
new Among ( "ea\u0163i", 38, 1, "", this),
|
||||
new Among ( "ia\u0163i", 38, 1, "", this),
|
||||
new Among ( "e\u0163i", -1, 2, "", this),
|
||||
new Among ( "i\u0163i", -1, 2, "", this),
|
||||
new Among ( "\u00E2\u0163i", -1, 2, "", this),
|
||||
new Among ( "ar\u0103\u0163i", -1, 1, "", this),
|
||||
new Among ( "ser\u0103\u0163i", -1, 2, "", this),
|
||||
new Among ( "aser\u0103\u0163i", 45, 1, "", this),
|
||||
new Among ( "seser\u0103\u0163i", 45, 2, "", this),
|
||||
new Among ( "iser\u0103\u0163i", 45, 1, "", this),
|
||||
new Among ( "user\u0103\u0163i", 45, 1, "", this),
|
||||
new Among ( "\u00E2ser\u0103\u0163i", 45, 1, "", this),
|
||||
new Among ( "ir\u0103\u0163i", -1, 1, "", this),
|
||||
new Among ( "ur\u0103\u0163i", -1, 1, "", this),
|
||||
new Among ( "\u00E2r\u0103\u0163i", -1, 1, "", this),
|
||||
new Among ( "am", -1, 1, "", this),
|
||||
new Among ( "eam", 54, 1, "", this),
|
||||
new Among ( "iam", 54, 1, "", this),
|
||||
new Among ( "em", -1, 2, "", this),
|
||||
new Among ( "asem", 57, 1, "", this),
|
||||
new Among ( "sesem", 57, 2, "", this),
|
||||
new Among ( "isem", 57, 1, "", this),
|
||||
new Among ( "usem", 57, 1, "", this),
|
||||
new Among ( "\u00E2sem", 57, 1, "", this),
|
||||
new Among ( "im", -1, 2, "", this),
|
||||
new Among ( "\u00E2m", -1, 2, "", this),
|
||||
new Among ( "\u0103m", -1, 2, "", this),
|
||||
new Among ( "ar\u0103m", 65, 1, "", this),
|
||||
new Among ( "ser\u0103m", 65, 2, "", this),
|
||||
new Among ( "aser\u0103m", 67, 1, "", this),
|
||||
new Among ( "seser\u0103m", 67, 2, "", this),
|
||||
new Among ( "iser\u0103m", 67, 1, "", this),
|
||||
new Among ( "user\u0103m", 67, 1, "", this),
|
||||
new Among ( "\u00E2ser\u0103m", 67, 1, "", this),
|
||||
new Among ( "ir\u0103m", 65, 1, "", this),
|
||||
new Among ( "ur\u0103m", 65, 1, "", this),
|
||||
new Among ( "\u00E2r\u0103m", 65, 1, "", this),
|
||||
new Among ( "au", -1, 1, "", this),
|
||||
new Among ( "eau", 76, 1, "", this),
|
||||
new Among ( "iau", 76, 1, "", this),
|
||||
new Among ( "indu", -1, 1, "", this),
|
||||
new Among ( "\u00E2ndu", -1, 1, "", this),
|
||||
new Among ( "ez", -1, 1, "", this),
|
||||
new Among ( "easc\u0103", -1, 1, "", this),
|
||||
new Among ( "ar\u0103", -1, 1, "", this),
|
||||
new Among ( "ser\u0103", -1, 2, "", this),
|
||||
new Among ( "aser\u0103", 84, 1, "", this),
|
||||
new Among ( "seser\u0103", 84, 2, "", this),
|
||||
new Among ( "iser\u0103", 84, 1, "", this),
|
||||
new Among ( "user\u0103", 84, 1, "", this),
|
||||
new Among ( "\u00E2ser\u0103", 84, 1, "", this),
|
||||
new Among ( "ir\u0103", -1, 1, "", this),
|
||||
new Among ( "ur\u0103", -1, 1, "", this),
|
||||
new Among ( "\u00E2r\u0103", -1, 1, "", this),
|
||||
new Among ( "eaz\u0103", -1, 1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "ea", -1, 1, "", methodObject ),
|
||||
new Among ( "ia", -1, 1, "", methodObject ),
|
||||
new Among ( "esc", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0103sc", -1, 1, "", methodObject ),
|
||||
new Among ( "ind", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2nd", -1, 1, "", methodObject ),
|
||||
new Among ( "are", -1, 1, "", methodObject ),
|
||||
new Among ( "ere", -1, 1, "", methodObject ),
|
||||
new Among ( "ire", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2re", -1, 1, "", methodObject ),
|
||||
new Among ( "se", -1, 2, "", methodObject ),
|
||||
new Among ( "ase", 10, 1, "", methodObject ),
|
||||
new Among ( "sese", 10, 2, "", methodObject ),
|
||||
new Among ( "ise", 10, 1, "", methodObject ),
|
||||
new Among ( "use", 10, 1, "", methodObject ),
|
||||
new Among ( "\u00E2se", 10, 1, "", methodObject ),
|
||||
new Among ( "e\u015Fte", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0103\u015Fte", -1, 1, "", methodObject ),
|
||||
new Among ( "eze", -1, 1, "", methodObject ),
|
||||
new Among ( "ai", -1, 1, "", methodObject ),
|
||||
new Among ( "eai", 19, 1, "", methodObject ),
|
||||
new Among ( "iai", 19, 1, "", methodObject ),
|
||||
new Among ( "sei", -1, 2, "", methodObject ),
|
||||
new Among ( "e\u015Fti", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0103\u015Fti", -1, 1, "", methodObject ),
|
||||
new Among ( "ui", -1, 1, "", methodObject ),
|
||||
new Among ( "ezi", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2i", -1, 1, "", methodObject ),
|
||||
new Among ( "a\u015Fi", -1, 1, "", methodObject ),
|
||||
new Among ( "se\u015Fi", -1, 2, "", methodObject ),
|
||||
new Among ( "ase\u015Fi", 29, 1, "", methodObject ),
|
||||
new Among ( "sese\u015Fi", 29, 2, "", methodObject ),
|
||||
new Among ( "ise\u015Fi", 29, 1, "", methodObject ),
|
||||
new Among ( "use\u015Fi", 29, 1, "", methodObject ),
|
||||
new Among ( "\u00E2se\u015Fi", 29, 1, "", methodObject ),
|
||||
new Among ( "i\u015Fi", -1, 1, "", methodObject ),
|
||||
new Among ( "u\u015Fi", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2\u015Fi", -1, 1, "", methodObject ),
|
||||
new Among ( "a\u0163i", -1, 2, "", methodObject ),
|
||||
new Among ( "ea\u0163i", 38, 1, "", methodObject ),
|
||||
new Among ( "ia\u0163i", 38, 1, "", methodObject ),
|
||||
new Among ( "e\u0163i", -1, 2, "", methodObject ),
|
||||
new Among ( "i\u0163i", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E2\u0163i", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u0103\u0163i", -1, 1, "", methodObject ),
|
||||
new Among ( "ser\u0103\u0163i", -1, 2, "", methodObject ),
|
||||
new Among ( "aser\u0103\u0163i", 45, 1, "", methodObject ),
|
||||
new Among ( "seser\u0103\u0163i", 45, 2, "", methodObject ),
|
||||
new Among ( "iser\u0103\u0163i", 45, 1, "", methodObject ),
|
||||
new Among ( "user\u0103\u0163i", 45, 1, "", methodObject ),
|
||||
new Among ( "\u00E2ser\u0103\u0163i", 45, 1, "", methodObject ),
|
||||
new Among ( "ir\u0103\u0163i", -1, 1, "", methodObject ),
|
||||
new Among ( "ur\u0103\u0163i", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2r\u0103\u0163i", -1, 1, "", methodObject ),
|
||||
new Among ( "am", -1, 1, "", methodObject ),
|
||||
new Among ( "eam", 54, 1, "", methodObject ),
|
||||
new Among ( "iam", 54, 1, "", methodObject ),
|
||||
new Among ( "em", -1, 2, "", methodObject ),
|
||||
new Among ( "asem", 57, 1, "", methodObject ),
|
||||
new Among ( "sesem", 57, 2, "", methodObject ),
|
||||
new Among ( "isem", 57, 1, "", methodObject ),
|
||||
new Among ( "usem", 57, 1, "", methodObject ),
|
||||
new Among ( "\u00E2sem", 57, 1, "", methodObject ),
|
||||
new Among ( "im", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E2m", -1, 2, "", methodObject ),
|
||||
new Among ( "\u0103m", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u0103m", 65, 1, "", methodObject ),
|
||||
new Among ( "ser\u0103m", 65, 2, "", methodObject ),
|
||||
new Among ( "aser\u0103m", 67, 1, "", methodObject ),
|
||||
new Among ( "seser\u0103m", 67, 2, "", methodObject ),
|
||||
new Among ( "iser\u0103m", 67, 1, "", methodObject ),
|
||||
new Among ( "user\u0103m", 67, 1, "", methodObject ),
|
||||
new Among ( "\u00E2ser\u0103m", 67, 1, "", methodObject ),
|
||||
new Among ( "ir\u0103m", 65, 1, "", methodObject ),
|
||||
new Among ( "ur\u0103m", 65, 1, "", methodObject ),
|
||||
new Among ( "\u00E2r\u0103m", 65, 1, "", methodObject ),
|
||||
new Among ( "au", -1, 1, "", methodObject ),
|
||||
new Among ( "eau", 76, 1, "", methodObject ),
|
||||
new Among ( "iau", 76, 1, "", methodObject ),
|
||||
new Among ( "indu", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2ndu", -1, 1, "", methodObject ),
|
||||
new Among ( "ez", -1, 1, "", methodObject ),
|
||||
new Among ( "easc\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "ar\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "ser\u0103", -1, 2, "", methodObject ),
|
||||
new Among ( "aser\u0103", 84, 1, "", methodObject ),
|
||||
new Among ( "seser\u0103", 84, 2, "", methodObject ),
|
||||
new Among ( "iser\u0103", 84, 1, "", methodObject ),
|
||||
new Among ( "user\u0103", 84, 1, "", methodObject ),
|
||||
new Among ( "\u00E2ser\u0103", 84, 1, "", methodObject ),
|
||||
new Among ( "ir\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "ur\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E2r\u0103", -1, 1, "", methodObject ),
|
||||
new Among ( "eaz\u0103", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "a", -1, 1, "", this),
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "ie", 1, 1, "", this),
|
||||
new Among ( "i", -1, 1, "", this),
|
||||
new Among ( "\u0103", -1, 1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "a", -1, 1, "", methodObject ),
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "ie", 1, 1, "", methodObject ),
|
||||
new Among ( "i", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0103", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 2, 32, 0, 0, 4 };
|
||||
|
@ -1020,5 +1027,15 @@ public class RomanianStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof RomanianStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return RomanianStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,169 +1,176 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class RussianStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "\u0432", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0432", 0, 2, "", this),
|
||||
new Among ( "\u044B\u0432", 0, 2, "", this),
|
||||
new Among ( "\u0432\u0448\u0438", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0432\u0448\u0438", 3, 2, "", this),
|
||||
new Among ( "\u044B\u0432\u0448\u0438", 3, 2, "", this),
|
||||
new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2, "", this),
|
||||
new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static RussianStemmer methodObject = new RussianStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "\u0432", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0432", 0, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u0432", 0, 2, "", methodObject ),
|
||||
new Among ( "\u0432\u0448\u0438", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0432\u0448\u0438", 3, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u0432\u0448\u0438", 3, 2, "", methodObject ),
|
||||
new Among ( "\u0432\u0448\u0438\u0441\u044C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0432\u0448\u0438\u0441\u044C", 6, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u0432\u0448\u0438\u0441\u044C", 6, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "\u0435\u0435", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0435", -1, 1, "", this),
|
||||
new Among ( "\u043E\u0435", -1, 1, "", this),
|
||||
new Among ( "\u044B\u0435", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043C\u0438", -1, 1, "", this),
|
||||
new Among ( "\u044B\u043C\u0438", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0439", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0439", -1, 1, "", this),
|
||||
new Among ( "\u043E\u0439", -1, 1, "", this),
|
||||
new Among ( "\u044B\u0439", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043C", -1, 1, "", this),
|
||||
new Among ( "\u043E\u043C", -1, 1, "", this),
|
||||
new Among ( "\u044B\u043C", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0433\u043E", -1, 1, "", this),
|
||||
new Among ( "\u043E\u0433\u043E", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043C\u0443", -1, 1, "", this),
|
||||
new Among ( "\u043E\u043C\u0443", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0445", -1, 1, "", this),
|
||||
new Among ( "\u044B\u0445", -1, 1, "", this),
|
||||
new Among ( "\u0435\u044E", -1, 1, "", this),
|
||||
new Among ( "\u043E\u044E", -1, 1, "", this),
|
||||
new Among ( "\u0443\u044E", -1, 1, "", this),
|
||||
new Among ( "\u044E\u044E", -1, 1, "", this),
|
||||
new Among ( "\u0430\u044F", -1, 1, "", this),
|
||||
new Among ( "\u044F\u044F", -1, 1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "\u0435\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044B\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043C\u0438", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044B\u043C\u0438", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0439", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0439", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u0439", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044B\u0439", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044B\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0433\u043E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u0433\u043E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043C\u0443", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u043C\u0443", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0445", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044B\u0445", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u044E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u044E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0443\u044E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044E\u044E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0430\u044F", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044F\u044F", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "\u0435\u043C", -1, 1, "", this),
|
||||
new Among ( "\u043D\u043D", -1, 1, "", this),
|
||||
new Among ( "\u0432\u0448", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0432\u0448", 2, 2, "", this),
|
||||
new Among ( "\u044B\u0432\u0448", 2, 2, "", this),
|
||||
new Among ( "\u0449", -1, 1, "", this),
|
||||
new Among ( "\u044E\u0449", 5, 1, "", this),
|
||||
new Among ( "\u0443\u044E\u0449", 6, 2, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043D\u043D", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0432\u0448", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0432\u0448", 2, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u0432\u0448", 2, 2, "", methodObject ),
|
||||
new Among ( "\u0449", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044E\u0449", 5, 1, "", methodObject ),
|
||||
new Among ( "\u0443\u044E\u0449", 6, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "\u0441\u044C", -1, 1, "", this),
|
||||
new Among ( "\u0441\u044F", -1, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "\u0441\u044C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0441\u044F", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "\u043B\u0430", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043B\u0430", 0, 2, "", this),
|
||||
new Among ( "\u044B\u043B\u0430", 0, 2, "", this),
|
||||
new Among ( "\u043D\u0430", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043D\u0430", 3, 2, "", this),
|
||||
new Among ( "\u0435\u0442\u0435", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0442\u0435", -1, 2, "", this),
|
||||
new Among ( "\u0439\u0442\u0435", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0439\u0442\u0435", 7, 2, "", this),
|
||||
new Among ( "\u0443\u0439\u0442\u0435", 7, 2, "", this),
|
||||
new Among ( "\u043B\u0438", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043B\u0438", 10, 2, "", this),
|
||||
new Among ( "\u044B\u043B\u0438", 10, 2, "", this),
|
||||
new Among ( "\u0439", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0439", 13, 2, "", this),
|
||||
new Among ( "\u0443\u0439", 13, 2, "", this),
|
||||
new Among ( "\u043B", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043B", 16, 2, "", this),
|
||||
new Among ( "\u044B\u043B", 16, 2, "", this),
|
||||
new Among ( "\u0435\u043C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043C", -1, 2, "", this),
|
||||
new Among ( "\u044B\u043C", -1, 2, "", this),
|
||||
new Among ( "\u043D", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043D", 22, 2, "", this),
|
||||
new Among ( "\u043B\u043E", -1, 1, "", this),
|
||||
new Among ( "\u0438\u043B\u043E", 24, 2, "", this),
|
||||
new Among ( "\u044B\u043B\u043E", 24, 2, "", this),
|
||||
new Among ( "\u043D\u043E", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043D\u043E", 27, 2, "", this),
|
||||
new Among ( "\u043D\u043D\u043E", 27, 1, "", this),
|
||||
new Among ( "\u0435\u0442", -1, 1, "", this),
|
||||
new Among ( "\u0443\u0435\u0442", 30, 2, "", this),
|
||||
new Among ( "\u0438\u0442", -1, 2, "", this),
|
||||
new Among ( "\u044B\u0442", -1, 2, "", this),
|
||||
new Among ( "\u044E\u0442", -1, 1, "", this),
|
||||
new Among ( "\u0443\u044E\u0442", 34, 2, "", this),
|
||||
new Among ( "\u044F\u0442", -1, 2, "", this),
|
||||
new Among ( "\u043D\u044B", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043D\u044B", 37, 2, "", this),
|
||||
new Among ( "\u0442\u044C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0442\u044C", 39, 2, "", this),
|
||||
new Among ( "\u044B\u0442\u044C", 39, 2, "", this),
|
||||
new Among ( "\u0435\u0448\u044C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0448\u044C", -1, 2, "", this),
|
||||
new Among ( "\u044E", -1, 2, "", this),
|
||||
new Among ( "\u0443\u044E", 44, 2, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "\u043B\u0430", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043B\u0430", 0, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u043B\u0430", 0, 2, "", methodObject ),
|
||||
new Among ( "\u043D\u0430", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043D\u0430", 3, 2, "", methodObject ),
|
||||
new Among ( "\u0435\u0442\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0442\u0435", -1, 2, "", methodObject ),
|
||||
new Among ( "\u0439\u0442\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0439\u0442\u0435", 7, 2, "", methodObject ),
|
||||
new Among ( "\u0443\u0439\u0442\u0435", 7, 2, "", methodObject ),
|
||||
new Among ( "\u043B\u0438", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043B\u0438", 10, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u043B\u0438", 10, 2, "", methodObject ),
|
||||
new Among ( "\u0439", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0439", 13, 2, "", methodObject ),
|
||||
new Among ( "\u0443\u0439", 13, 2, "", methodObject ),
|
||||
new Among ( "\u043B", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043B", 16, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u043B", 16, 2, "", methodObject ),
|
||||
new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043C", -1, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u043C", -1, 2, "", methodObject ),
|
||||
new Among ( "\u043D", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043D", 22, 2, "", methodObject ),
|
||||
new Among ( "\u043B\u043E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u043B\u043E", 24, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u043B\u043E", 24, 2, "", methodObject ),
|
||||
new Among ( "\u043D\u043E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043D\u043E", 27, 2, "", methodObject ),
|
||||
new Among ( "\u043D\u043D\u043E", 27, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0442", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0443\u0435\u0442", 30, 2, "", methodObject ),
|
||||
new Among ( "\u0438\u0442", -1, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u0442", -1, 2, "", methodObject ),
|
||||
new Among ( "\u044E\u0442", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0443\u044E\u0442", 34, 2, "", methodObject ),
|
||||
new Among ( "\u044F\u0442", -1, 2, "", methodObject ),
|
||||
new Among ( "\u043D\u044B", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043D\u044B", 37, 2, "", methodObject ),
|
||||
new Among ( "\u0442\u044C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0442\u044C", 39, 2, "", methodObject ),
|
||||
new Among ( "\u044B\u0442\u044C", 39, 2, "", methodObject ),
|
||||
new Among ( "\u0435\u0448\u044C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0448\u044C", -1, 2, "", methodObject ),
|
||||
new Among ( "\u044E", -1, 2, "", methodObject ),
|
||||
new Among ( "\u0443\u044E", 44, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "\u0430", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0432", -1, 1, "", this),
|
||||
new Among ( "\u043E\u0432", -1, 1, "", this),
|
||||
new Among ( "\u0435", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0435", 3, 1, "", this),
|
||||
new Among ( "\u044C\u0435", 3, 1, "", this),
|
||||
new Among ( "\u0438", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0438", 6, 1, "", this),
|
||||
new Among ( "\u0438\u0438", 6, 1, "", this),
|
||||
new Among ( "\u0430\u043C\u0438", 6, 1, "", this),
|
||||
new Among ( "\u044F\u043C\u0438", 6, 1, "", this),
|
||||
new Among ( "\u0438\u044F\u043C\u0438", 10, 1, "", this),
|
||||
new Among ( "\u0439", -1, 1, "", this),
|
||||
new Among ( "\u0435\u0439", 12, 1, "", this),
|
||||
new Among ( "\u0438\u0435\u0439", 13, 1, "", this),
|
||||
new Among ( "\u0438\u0439", 12, 1, "", this),
|
||||
new Among ( "\u043E\u0439", 12, 1, "", this),
|
||||
new Among ( "\u0430\u043C", -1, 1, "", this),
|
||||
new Among ( "\u0435\u043C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u0435\u043C", 18, 1, "", this),
|
||||
new Among ( "\u043E\u043C", -1, 1, "", this),
|
||||
new Among ( "\u044F\u043C", -1, 1, "", this),
|
||||
new Among ( "\u0438\u044F\u043C", 21, 1, "", this),
|
||||
new Among ( "\u043E", -1, 1, "", this),
|
||||
new Among ( "\u0443", -1, 1, "", this),
|
||||
new Among ( "\u0430\u0445", -1, 1, "", this),
|
||||
new Among ( "\u044F\u0445", -1, 1, "", this),
|
||||
new Among ( "\u0438\u044F\u0445", 26, 1, "", this),
|
||||
new Among ( "\u044B", -1, 1, "", this),
|
||||
new Among ( "\u044C", -1, 1, "", this),
|
||||
new Among ( "\u044E", -1, 1, "", this),
|
||||
new Among ( "\u0438\u044E", 30, 1, "", this),
|
||||
new Among ( "\u044C\u044E", 30, 1, "", this),
|
||||
new Among ( "\u044F", -1, 1, "", this),
|
||||
new Among ( "\u0438\u044F", 33, 1, "", this),
|
||||
new Among ( "\u044C\u044F", 33, 1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "\u0430", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0432", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u0432", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0435", 3, 1, "", methodObject ),
|
||||
new Among ( "\u044C\u0435", 3, 1, "", methodObject ),
|
||||
new Among ( "\u0438", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0438", 6, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0438", 6, 1, "", methodObject ),
|
||||
new Among ( "\u0430\u043C\u0438", 6, 1, "", methodObject ),
|
||||
new Among ( "\u044F\u043C\u0438", 6, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u044F\u043C\u0438", 10, 1, "", methodObject ),
|
||||
new Among ( "\u0439", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u0439", 12, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0435\u0439", 13, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0439", 12, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u0439", 12, 1, "", methodObject ),
|
||||
new Among ( "\u0430\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0435\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u0435\u043C", 18, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044F\u043C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u044F\u043C", 21, 1, "", methodObject ),
|
||||
new Among ( "\u043E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0443", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0430\u0445", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044F\u0445", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u044F\u0445", 26, 1, "", methodObject ),
|
||||
new Among ( "\u044B", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044C", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044E", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u044E", 30, 1, "", methodObject ),
|
||||
new Among ( "\u044C\u044E", 30, 1, "", methodObject ),
|
||||
new Among ( "\u044F", -1, 1, "", methodObject ),
|
||||
new Among ( "\u0438\u044F", 33, 1, "", methodObject ),
|
||||
new Among ( "\u044C\u044F", 33, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "\u043E\u0441\u0442", -1, 1, "", this),
|
||||
new Among ( "\u043E\u0441\u0442\u044C", -1, 1, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "\u043E\u0441\u0442", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043E\u0441\u0442\u044C", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "\u0435\u0439\u0448\u0435", -1, 1, "", this),
|
||||
new Among ( "\u043D", -1, 2, "", this),
|
||||
new Among ( "\u0435\u0439\u0448", -1, 1, "", this),
|
||||
new Among ( "\u044C", -1, 3, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "\u0435\u0439\u0448\u0435", -1, 1, "", methodObject ),
|
||||
new Among ( "\u043D", -1, 2, "", methodObject ),
|
||||
new Among ( "\u0435\u0439\u0448", -1, 1, "", methodObject ),
|
||||
new Among ( "\u044C", -1, 3, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {33, 65, 8, 232 };
|
||||
|
@ -723,5 +730,15 @@ public class RussianStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof RussianStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return RussianStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,244 +1,251 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class SpanishStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", this),
|
||||
new Among ( "\u00E1", 0, 1, "", this),
|
||||
new Among ( "\u00E9", 0, 2, "", this),
|
||||
new Among ( "\u00ED", 0, 3, "", this),
|
||||
new Among ( "\u00F3", 0, 4, "", this),
|
||||
new Among ( "\u00FA", 0, 5, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static SpanishStemmer methodObject = new SpanishStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "", -1, 6, "", methodObject ),
|
||||
new Among ( "\u00E1", 0, 1, "", methodObject ),
|
||||
new Among ( "\u00E9", 0, 2, "", methodObject ),
|
||||
new Among ( "\u00ED", 0, 3, "", methodObject ),
|
||||
new Among ( "\u00F3", 0, 4, "", methodObject ),
|
||||
new Among ( "\u00FA", 0, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "la", -1, -1, "", this),
|
||||
new Among ( "sela", 0, -1, "", this),
|
||||
new Among ( "le", -1, -1, "", this),
|
||||
new Among ( "me", -1, -1, "", this),
|
||||
new Among ( "se", -1, -1, "", this),
|
||||
new Among ( "lo", -1, -1, "", this),
|
||||
new Among ( "selo", 5, -1, "", this),
|
||||
new Among ( "las", -1, -1, "", this),
|
||||
new Among ( "selas", 7, -1, "", this),
|
||||
new Among ( "les", -1, -1, "", this),
|
||||
new Among ( "los", -1, -1, "", this),
|
||||
new Among ( "selos", 10, -1, "", this),
|
||||
new Among ( "nos", -1, -1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "la", -1, -1, "", methodObject ),
|
||||
new Among ( "sela", 0, -1, "", methodObject ),
|
||||
new Among ( "le", -1, -1, "", methodObject ),
|
||||
new Among ( "me", -1, -1, "", methodObject ),
|
||||
new Among ( "se", -1, -1, "", methodObject ),
|
||||
new Among ( "lo", -1, -1, "", methodObject ),
|
||||
new Among ( "selo", 5, -1, "", methodObject ),
|
||||
new Among ( "las", -1, -1, "", methodObject ),
|
||||
new Among ( "selas", 7, -1, "", methodObject ),
|
||||
new Among ( "les", -1, -1, "", methodObject ),
|
||||
new Among ( "los", -1, -1, "", methodObject ),
|
||||
new Among ( "selos", 10, -1, "", methodObject ),
|
||||
new Among ( "nos", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ando", -1, 6, "", this),
|
||||
new Among ( "iendo", -1, 6, "", this),
|
||||
new Among ( "yendo", -1, 7, "", this),
|
||||
new Among ( "\u00E1ndo", -1, 2, "", this),
|
||||
new Among ( "i\u00E9ndo", -1, 1, "", this),
|
||||
new Among ( "ar", -1, 6, "", this),
|
||||
new Among ( "er", -1, 6, "", this),
|
||||
new Among ( "ir", -1, 6, "", this),
|
||||
new Among ( "\u00E1r", -1, 3, "", this),
|
||||
new Among ( "\u00E9r", -1, 4, "", this),
|
||||
new Among ( "\u00EDr", -1, 5, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ando", -1, 6, "", methodObject ),
|
||||
new Among ( "iendo", -1, 6, "", methodObject ),
|
||||
new Among ( "yendo", -1, 7, "", methodObject ),
|
||||
new Among ( "\u00E1ndo", -1, 2, "", methodObject ),
|
||||
new Among ( "i\u00E9ndo", -1, 1, "", methodObject ),
|
||||
new Among ( "ar", -1, 6, "", methodObject ),
|
||||
new Among ( "er", -1, 6, "", methodObject ),
|
||||
new Among ( "ir", -1, 6, "", methodObject ),
|
||||
new Among ( "\u00E1r", -1, 3, "", methodObject ),
|
||||
new Among ( "\u00E9r", -1, 4, "", methodObject ),
|
||||
new Among ( "\u00EDr", -1, 5, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "ic", -1, -1, "", this),
|
||||
new Among ( "ad", -1, -1, "", this),
|
||||
new Among ( "os", -1, -1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "ic", -1, -1, "", methodObject ),
|
||||
new Among ( "ad", -1, -1, "", methodObject ),
|
||||
new Among ( "os", -1, -1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "able", -1, 1, "", this),
|
||||
new Among ( "ible", -1, 1, "", this),
|
||||
new Among ( "ante", -1, 1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "able", -1, 1, "", methodObject ),
|
||||
new Among ( "ible", -1, 1, "", methodObject ),
|
||||
new Among ( "ante", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "ic", -1, 1, "", this),
|
||||
new Among ( "abil", -1, 1, "", this),
|
||||
new Among ( "iv", -1, 1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "ic", -1, 1, "", methodObject ),
|
||||
new Among ( "abil", -1, 1, "", methodObject ),
|
||||
new Among ( "iv", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "ica", -1, 1, "", this),
|
||||
new Among ( "ancia", -1, 2, "", this),
|
||||
new Among ( "encia", -1, 5, "", this),
|
||||
new Among ( "adora", -1, 2, "", this),
|
||||
new Among ( "osa", -1, 1, "", this),
|
||||
new Among ( "ista", -1, 1, "", this),
|
||||
new Among ( "iva", -1, 9, "", this),
|
||||
new Among ( "anza", -1, 1, "", this),
|
||||
new Among ( "log\u00EDa", -1, 3, "", this),
|
||||
new Among ( "idad", -1, 8, "", this),
|
||||
new Among ( "able", -1, 1, "", this),
|
||||
new Among ( "ible", -1, 1, "", this),
|
||||
new Among ( "ante", -1, 2, "", this),
|
||||
new Among ( "mente", -1, 7, "", this),
|
||||
new Among ( "amente", 13, 6, "", this),
|
||||
new Among ( "aci\u00F3n", -1, 2, "", this),
|
||||
new Among ( "uci\u00F3n", -1, 4, "", this),
|
||||
new Among ( "ico", -1, 1, "", this),
|
||||
new Among ( "ismo", -1, 1, "", this),
|
||||
new Among ( "oso", -1, 1, "", this),
|
||||
new Among ( "amiento", -1, 1, "", this),
|
||||
new Among ( "imiento", -1, 1, "", this),
|
||||
new Among ( "ivo", -1, 9, "", this),
|
||||
new Among ( "ador", -1, 2, "", this),
|
||||
new Among ( "icas", -1, 1, "", this),
|
||||
new Among ( "ancias", -1, 2, "", this),
|
||||
new Among ( "encias", -1, 5, "", this),
|
||||
new Among ( "adoras", -1, 2, "", this),
|
||||
new Among ( "osas", -1, 1, "", this),
|
||||
new Among ( "istas", -1, 1, "", this),
|
||||
new Among ( "ivas", -1, 9, "", this),
|
||||
new Among ( "anzas", -1, 1, "", this),
|
||||
new Among ( "log\u00EDas", -1, 3, "", this),
|
||||
new Among ( "idades", -1, 8, "", this),
|
||||
new Among ( "ables", -1, 1, "", this),
|
||||
new Among ( "ibles", -1, 1, "", this),
|
||||
new Among ( "aciones", -1, 2, "", this),
|
||||
new Among ( "uciones", -1, 4, "", this),
|
||||
new Among ( "adores", -1, 2, "", this),
|
||||
new Among ( "antes", -1, 2, "", this),
|
||||
new Among ( "icos", -1, 1, "", this),
|
||||
new Among ( "ismos", -1, 1, "", this),
|
||||
new Among ( "osos", -1, 1, "", this),
|
||||
new Among ( "amientos", -1, 1, "", this),
|
||||
new Among ( "imientos", -1, 1, "", this),
|
||||
new Among ( "ivos", -1, 9, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "ica", -1, 1, "", methodObject ),
|
||||
new Among ( "ancia", -1, 2, "", methodObject ),
|
||||
new Among ( "encia", -1, 5, "", methodObject ),
|
||||
new Among ( "adora", -1, 2, "", methodObject ),
|
||||
new Among ( "osa", -1, 1, "", methodObject ),
|
||||
new Among ( "ista", -1, 1, "", methodObject ),
|
||||
new Among ( "iva", -1, 9, "", methodObject ),
|
||||
new Among ( "anza", -1, 1, "", methodObject ),
|
||||
new Among ( "log\u00EDa", -1, 3, "", methodObject ),
|
||||
new Among ( "idad", -1, 8, "", methodObject ),
|
||||
new Among ( "able", -1, 1, "", methodObject ),
|
||||
new Among ( "ible", -1, 1, "", methodObject ),
|
||||
new Among ( "ante", -1, 2, "", methodObject ),
|
||||
new Among ( "mente", -1, 7, "", methodObject ),
|
||||
new Among ( "amente", 13, 6, "", methodObject ),
|
||||
new Among ( "aci\u00F3n", -1, 2, "", methodObject ),
|
||||
new Among ( "uci\u00F3n", -1, 4, "", methodObject ),
|
||||
new Among ( "ico", -1, 1, "", methodObject ),
|
||||
new Among ( "ismo", -1, 1, "", methodObject ),
|
||||
new Among ( "oso", -1, 1, "", methodObject ),
|
||||
new Among ( "amiento", -1, 1, "", methodObject ),
|
||||
new Among ( "imiento", -1, 1, "", methodObject ),
|
||||
new Among ( "ivo", -1, 9, "", methodObject ),
|
||||
new Among ( "ador", -1, 2, "", methodObject ),
|
||||
new Among ( "icas", -1, 1, "", methodObject ),
|
||||
new Among ( "ancias", -1, 2, "", methodObject ),
|
||||
new Among ( "encias", -1, 5, "", methodObject ),
|
||||
new Among ( "adoras", -1, 2, "", methodObject ),
|
||||
new Among ( "osas", -1, 1, "", methodObject ),
|
||||
new Among ( "istas", -1, 1, "", methodObject ),
|
||||
new Among ( "ivas", -1, 9, "", methodObject ),
|
||||
new Among ( "anzas", -1, 1, "", methodObject ),
|
||||
new Among ( "log\u00EDas", -1, 3, "", methodObject ),
|
||||
new Among ( "idades", -1, 8, "", methodObject ),
|
||||
new Among ( "ables", -1, 1, "", methodObject ),
|
||||
new Among ( "ibles", -1, 1, "", methodObject ),
|
||||
new Among ( "aciones", -1, 2, "", methodObject ),
|
||||
new Among ( "uciones", -1, 4, "", methodObject ),
|
||||
new Among ( "adores", -1, 2, "", methodObject ),
|
||||
new Among ( "antes", -1, 2, "", methodObject ),
|
||||
new Among ( "icos", -1, 1, "", methodObject ),
|
||||
new Among ( "ismos", -1, 1, "", methodObject ),
|
||||
new Among ( "osos", -1, 1, "", methodObject ),
|
||||
new Among ( "amientos", -1, 1, "", methodObject ),
|
||||
new Among ( "imientos", -1, 1, "", methodObject ),
|
||||
new Among ( "ivos", -1, 9, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "ya", -1, 1, "", this),
|
||||
new Among ( "ye", -1, 1, "", this),
|
||||
new Among ( "yan", -1, 1, "", this),
|
||||
new Among ( "yen", -1, 1, "", this),
|
||||
new Among ( "yeron", -1, 1, "", this),
|
||||
new Among ( "yendo", -1, 1, "", this),
|
||||
new Among ( "yo", -1, 1, "", this),
|
||||
new Among ( "yas", -1, 1, "", this),
|
||||
new Among ( "yes", -1, 1, "", this),
|
||||
new Among ( "yais", -1, 1, "", this),
|
||||
new Among ( "yamos", -1, 1, "", this),
|
||||
new Among ( "y\u00F3", -1, 1, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "ya", -1, 1, "", methodObject ),
|
||||
new Among ( "ye", -1, 1, "", methodObject ),
|
||||
new Among ( "yan", -1, 1, "", methodObject ),
|
||||
new Among ( "yen", -1, 1, "", methodObject ),
|
||||
new Among ( "yeron", -1, 1, "", methodObject ),
|
||||
new Among ( "yendo", -1, 1, "", methodObject ),
|
||||
new Among ( "yo", -1, 1, "", methodObject ),
|
||||
new Among ( "yas", -1, 1, "", methodObject ),
|
||||
new Among ( "yes", -1, 1, "", methodObject ),
|
||||
new Among ( "yais", -1, 1, "", methodObject ),
|
||||
new Among ( "yamos", -1, 1, "", methodObject ),
|
||||
new Among ( "y\u00F3", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "aba", -1, 2, "", this),
|
||||
new Among ( "ada", -1, 2, "", this),
|
||||
new Among ( "ida", -1, 2, "", this),
|
||||
new Among ( "ara", -1, 2, "", this),
|
||||
new Among ( "iera", -1, 2, "", this),
|
||||
new Among ( "\u00EDa", -1, 2, "", this),
|
||||
new Among ( "ar\u00EDa", 5, 2, "", this),
|
||||
new Among ( "er\u00EDa", 5, 2, "", this),
|
||||
new Among ( "ir\u00EDa", 5, 2, "", this),
|
||||
new Among ( "ad", -1, 2, "", this),
|
||||
new Among ( "ed", -1, 2, "", this),
|
||||
new Among ( "id", -1, 2, "", this),
|
||||
new Among ( "ase", -1, 2, "", this),
|
||||
new Among ( "iese", -1, 2, "", this),
|
||||
new Among ( "aste", -1, 2, "", this),
|
||||
new Among ( "iste", -1, 2, "", this),
|
||||
new Among ( "an", -1, 2, "", this),
|
||||
new Among ( "aban", 16, 2, "", this),
|
||||
new Among ( "aran", 16, 2, "", this),
|
||||
new Among ( "ieran", 16, 2, "", this),
|
||||
new Among ( "\u00EDan", 16, 2, "", this),
|
||||
new Among ( "ar\u00EDan", 20, 2, "", this),
|
||||
new Among ( "er\u00EDan", 20, 2, "", this),
|
||||
new Among ( "ir\u00EDan", 20, 2, "", this),
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "asen", 24, 2, "", this),
|
||||
new Among ( "iesen", 24, 2, "", this),
|
||||
new Among ( "aron", -1, 2, "", this),
|
||||
new Among ( "ieron", -1, 2, "", this),
|
||||
new Among ( "ar\u00E1n", -1, 2, "", this),
|
||||
new Among ( "er\u00E1n", -1, 2, "", this),
|
||||
new Among ( "ir\u00E1n", -1, 2, "", this),
|
||||
new Among ( "ado", -1, 2, "", this),
|
||||
new Among ( "ido", -1, 2, "", this),
|
||||
new Among ( "ando", -1, 2, "", this),
|
||||
new Among ( "iendo", -1, 2, "", this),
|
||||
new Among ( "ar", -1, 2, "", this),
|
||||
new Among ( "er", -1, 2, "", this),
|
||||
new Among ( "ir", -1, 2, "", this),
|
||||
new Among ( "as", -1, 2, "", this),
|
||||
new Among ( "abas", 39, 2, "", this),
|
||||
new Among ( "adas", 39, 2, "", this),
|
||||
new Among ( "idas", 39, 2, "", this),
|
||||
new Among ( "aras", 39, 2, "", this),
|
||||
new Among ( "ieras", 39, 2, "", this),
|
||||
new Among ( "\u00EDas", 39, 2, "", this),
|
||||
new Among ( "ar\u00EDas", 45, 2, "", this),
|
||||
new Among ( "er\u00EDas", 45, 2, "", this),
|
||||
new Among ( "ir\u00EDas", 45, 2, "", this),
|
||||
new Among ( "es", -1, 1, "", this),
|
||||
new Among ( "ases", 49, 2, "", this),
|
||||
new Among ( "ieses", 49, 2, "", this),
|
||||
new Among ( "abais", -1, 2, "", this),
|
||||
new Among ( "arais", -1, 2, "", this),
|
||||
new Among ( "ierais", -1, 2, "", this),
|
||||
new Among ( "\u00EDais", -1, 2, "", this),
|
||||
new Among ( "ar\u00EDais", 55, 2, "", this),
|
||||
new Among ( "er\u00EDais", 55, 2, "", this),
|
||||
new Among ( "ir\u00EDais", 55, 2, "", this),
|
||||
new Among ( "aseis", -1, 2, "", this),
|
||||
new Among ( "ieseis", -1, 2, "", this),
|
||||
new Among ( "asteis", -1, 2, "", this),
|
||||
new Among ( "isteis", -1, 2, "", this),
|
||||
new Among ( "\u00E1is", -1, 2, "", this),
|
||||
new Among ( "\u00E9is", -1, 1, "", this),
|
||||
new Among ( "ar\u00E9is", 64, 2, "", this),
|
||||
new Among ( "er\u00E9is", 64, 2, "", this),
|
||||
new Among ( "ir\u00E9is", 64, 2, "", this),
|
||||
new Among ( "ados", -1, 2, "", this),
|
||||
new Among ( "idos", -1, 2, "", this),
|
||||
new Among ( "amos", -1, 2, "", this),
|
||||
new Among ( "\u00E1bamos", 70, 2, "", this),
|
||||
new Among ( "\u00E1ramos", 70, 2, "", this),
|
||||
new Among ( "i\u00E9ramos", 70, 2, "", this),
|
||||
new Among ( "\u00EDamos", 70, 2, "", this),
|
||||
new Among ( "ar\u00EDamos", 74, 2, "", this),
|
||||
new Among ( "er\u00EDamos", 74, 2, "", this),
|
||||
new Among ( "ir\u00EDamos", 74, 2, "", this),
|
||||
new Among ( "emos", -1, 1, "", this),
|
||||
new Among ( "aremos", 78, 2, "", this),
|
||||
new Among ( "eremos", 78, 2, "", this),
|
||||
new Among ( "iremos", 78, 2, "", this),
|
||||
new Among ( "\u00E1semos", 78, 2, "", this),
|
||||
new Among ( "i\u00E9semos", 78, 2, "", this),
|
||||
new Among ( "imos", -1, 2, "", this),
|
||||
new Among ( "ar\u00E1s", -1, 2, "", this),
|
||||
new Among ( "er\u00E1s", -1, 2, "", this),
|
||||
new Among ( "ir\u00E1s", -1, 2, "", this),
|
||||
new Among ( "\u00EDs", -1, 2, "", this),
|
||||
new Among ( "ar\u00E1", -1, 2, "", this),
|
||||
new Among ( "er\u00E1", -1, 2, "", this),
|
||||
new Among ( "ir\u00E1", -1, 2, "", this),
|
||||
new Among ( "ar\u00E9", -1, 2, "", this),
|
||||
new Among ( "er\u00E9", -1, 2, "", this),
|
||||
new Among ( "ir\u00E9", -1, 2, "", this),
|
||||
new Among ( "i\u00F3", -1, 2, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "aba", -1, 2, "", methodObject ),
|
||||
new Among ( "ada", -1, 2, "", methodObject ),
|
||||
new Among ( "ida", -1, 2, "", methodObject ),
|
||||
new Among ( "ara", -1, 2, "", methodObject ),
|
||||
new Among ( "iera", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00EDa", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u00EDa", 5, 2, "", methodObject ),
|
||||
new Among ( "er\u00EDa", 5, 2, "", methodObject ),
|
||||
new Among ( "ir\u00EDa", 5, 2, "", methodObject ),
|
||||
new Among ( "ad", -1, 2, "", methodObject ),
|
||||
new Among ( "ed", -1, 2, "", methodObject ),
|
||||
new Among ( "id", -1, 2, "", methodObject ),
|
||||
new Among ( "ase", -1, 2, "", methodObject ),
|
||||
new Among ( "iese", -1, 2, "", methodObject ),
|
||||
new Among ( "aste", -1, 2, "", methodObject ),
|
||||
new Among ( "iste", -1, 2, "", methodObject ),
|
||||
new Among ( "an", -1, 2, "", methodObject ),
|
||||
new Among ( "aban", 16, 2, "", methodObject ),
|
||||
new Among ( "aran", 16, 2, "", methodObject ),
|
||||
new Among ( "ieran", 16, 2, "", methodObject ),
|
||||
new Among ( "\u00EDan", 16, 2, "", methodObject ),
|
||||
new Among ( "ar\u00EDan", 20, 2, "", methodObject ),
|
||||
new Among ( "er\u00EDan", 20, 2, "", methodObject ),
|
||||
new Among ( "ir\u00EDan", 20, 2, "", methodObject ),
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "asen", 24, 2, "", methodObject ),
|
||||
new Among ( "iesen", 24, 2, "", methodObject ),
|
||||
new Among ( "aron", -1, 2, "", methodObject ),
|
||||
new Among ( "ieron", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u00E1n", -1, 2, "", methodObject ),
|
||||
new Among ( "er\u00E1n", -1, 2, "", methodObject ),
|
||||
new Among ( "ir\u00E1n", -1, 2, "", methodObject ),
|
||||
new Among ( "ado", -1, 2, "", methodObject ),
|
||||
new Among ( "ido", -1, 2, "", methodObject ),
|
||||
new Among ( "ando", -1, 2, "", methodObject ),
|
||||
new Among ( "iendo", -1, 2, "", methodObject ),
|
||||
new Among ( "ar", -1, 2, "", methodObject ),
|
||||
new Among ( "er", -1, 2, "", methodObject ),
|
||||
new Among ( "ir", -1, 2, "", methodObject ),
|
||||
new Among ( "as", -1, 2, "", methodObject ),
|
||||
new Among ( "abas", 39, 2, "", methodObject ),
|
||||
new Among ( "adas", 39, 2, "", methodObject ),
|
||||
new Among ( "idas", 39, 2, "", methodObject ),
|
||||
new Among ( "aras", 39, 2, "", methodObject ),
|
||||
new Among ( "ieras", 39, 2, "", methodObject ),
|
||||
new Among ( "\u00EDas", 39, 2, "", methodObject ),
|
||||
new Among ( "ar\u00EDas", 45, 2, "", methodObject ),
|
||||
new Among ( "er\u00EDas", 45, 2, "", methodObject ),
|
||||
new Among ( "ir\u00EDas", 45, 2, "", methodObject ),
|
||||
new Among ( "es", -1, 1, "", methodObject ),
|
||||
new Among ( "ases", 49, 2, "", methodObject ),
|
||||
new Among ( "ieses", 49, 2, "", methodObject ),
|
||||
new Among ( "abais", -1, 2, "", methodObject ),
|
||||
new Among ( "arais", -1, 2, "", methodObject ),
|
||||
new Among ( "ierais", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00EDais", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u00EDais", 55, 2, "", methodObject ),
|
||||
new Among ( "er\u00EDais", 55, 2, "", methodObject ),
|
||||
new Among ( "ir\u00EDais", 55, 2, "", methodObject ),
|
||||
new Among ( "aseis", -1, 2, "", methodObject ),
|
||||
new Among ( "ieseis", -1, 2, "", methodObject ),
|
||||
new Among ( "asteis", -1, 2, "", methodObject ),
|
||||
new Among ( "isteis", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E1is", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E9is", -1, 1, "", methodObject ),
|
||||
new Among ( "ar\u00E9is", 64, 2, "", methodObject ),
|
||||
new Among ( "er\u00E9is", 64, 2, "", methodObject ),
|
||||
new Among ( "ir\u00E9is", 64, 2, "", methodObject ),
|
||||
new Among ( "ados", -1, 2, "", methodObject ),
|
||||
new Among ( "idos", -1, 2, "", methodObject ),
|
||||
new Among ( "amos", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00E1bamos", 70, 2, "", methodObject ),
|
||||
new Among ( "\u00E1ramos", 70, 2, "", methodObject ),
|
||||
new Among ( "i\u00E9ramos", 70, 2, "", methodObject ),
|
||||
new Among ( "\u00EDamos", 70, 2, "", methodObject ),
|
||||
new Among ( "ar\u00EDamos", 74, 2, "", methodObject ),
|
||||
new Among ( "er\u00EDamos", 74, 2, "", methodObject ),
|
||||
new Among ( "ir\u00EDamos", 74, 2, "", methodObject ),
|
||||
new Among ( "emos", -1, 1, "", methodObject ),
|
||||
new Among ( "aremos", 78, 2, "", methodObject ),
|
||||
new Among ( "eremos", 78, 2, "", methodObject ),
|
||||
new Among ( "iremos", 78, 2, "", methodObject ),
|
||||
new Among ( "\u00E1semos", 78, 2, "", methodObject ),
|
||||
new Among ( "i\u00E9semos", 78, 2, "", methodObject ),
|
||||
new Among ( "imos", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u00E1s", -1, 2, "", methodObject ),
|
||||
new Among ( "er\u00E1s", -1, 2, "", methodObject ),
|
||||
new Among ( "ir\u00E1s", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00EDs", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u00E1", -1, 2, "", methodObject ),
|
||||
new Among ( "er\u00E1", -1, 2, "", methodObject ),
|
||||
new Among ( "ir\u00E1", -1, 2, "", methodObject ),
|
||||
new Among ( "ar\u00E9", -1, 2, "", methodObject ),
|
||||
new Among ( "er\u00E9", -1, 2, "", methodObject ),
|
||||
new Among ( "ir\u00E9", -1, 2, "", methodObject ),
|
||||
new Among ( "i\u00F3", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_9[] = {
|
||||
new Among ( "a", -1, 1, "", this),
|
||||
new Among ( "e", -1, 2, "", this),
|
||||
new Among ( "o", -1, 1, "", this),
|
||||
new Among ( "os", -1, 1, "", this),
|
||||
new Among ( "\u00E1", -1, 1, "", this),
|
||||
new Among ( "\u00E9", -1, 2, "", this),
|
||||
new Among ( "\u00ED", -1, 1, "", this),
|
||||
new Among ( "\u00F3", -1, 1, "", this)
|
||||
private final static Among a_9[] = {
|
||||
new Among ( "a", -1, 1, "", methodObject ),
|
||||
new Among ( "e", -1, 2, "", methodObject ),
|
||||
new Among ( "o", -1, 1, "", methodObject ),
|
||||
new Among ( "os", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E1", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00E9", -1, 2, "", methodObject ),
|
||||
new Among ( "\u00ED", -1, 1, "", methodObject ),
|
||||
new Among ( "\u00F3", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 1, 17, 4, 10 };
|
||||
|
@ -1178,5 +1185,15 @@ public class SpanishStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof SpanishStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return SpanishStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,70 +1,77 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class SwedishStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "a", -1, 1, "", this),
|
||||
new Among ( "arna", 0, 1, "", this),
|
||||
new Among ( "erna", 0, 1, "", this),
|
||||
new Among ( "heterna", 2, 1, "", this),
|
||||
new Among ( "orna", 0, 1, "", this),
|
||||
new Among ( "ad", -1, 1, "", this),
|
||||
new Among ( "e", -1, 1, "", this),
|
||||
new Among ( "ade", 6, 1, "", this),
|
||||
new Among ( "ande", 6, 1, "", this),
|
||||
new Among ( "arne", 6, 1, "", this),
|
||||
new Among ( "are", 6, 1, "", this),
|
||||
new Among ( "aste", 6, 1, "", this),
|
||||
new Among ( "en", -1, 1, "", this),
|
||||
new Among ( "anden", 12, 1, "", this),
|
||||
new Among ( "aren", 12, 1, "", this),
|
||||
new Among ( "heten", 12, 1, "", this),
|
||||
new Among ( "ern", -1, 1, "", this),
|
||||
new Among ( "ar", -1, 1, "", this),
|
||||
new Among ( "er", -1, 1, "", this),
|
||||
new Among ( "heter", 18, 1, "", this),
|
||||
new Among ( "or", -1, 1, "", this),
|
||||
new Among ( "s", -1, 2, "", this),
|
||||
new Among ( "as", 21, 1, "", this),
|
||||
new Among ( "arnas", 22, 1, "", this),
|
||||
new Among ( "ernas", 22, 1, "", this),
|
||||
new Among ( "ornas", 22, 1, "", this),
|
||||
new Among ( "es", 21, 1, "", this),
|
||||
new Among ( "ades", 26, 1, "", this),
|
||||
new Among ( "andes", 26, 1, "", this),
|
||||
new Among ( "ens", 21, 1, "", this),
|
||||
new Among ( "arens", 29, 1, "", this),
|
||||
new Among ( "hetens", 29, 1, "", this),
|
||||
new Among ( "erns", 21, 1, "", this),
|
||||
new Among ( "at", -1, 1, "", this),
|
||||
new Among ( "andet", -1, 1, "", this),
|
||||
new Among ( "het", -1, 1, "", this),
|
||||
new Among ( "ast", -1, 1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static SwedishStemmer methodObject = new SwedishStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "a", -1, 1, "", methodObject ),
|
||||
new Among ( "arna", 0, 1, "", methodObject ),
|
||||
new Among ( "erna", 0, 1, "", methodObject ),
|
||||
new Among ( "heterna", 2, 1, "", methodObject ),
|
||||
new Among ( "orna", 0, 1, "", methodObject ),
|
||||
new Among ( "ad", -1, 1, "", methodObject ),
|
||||
new Among ( "e", -1, 1, "", methodObject ),
|
||||
new Among ( "ade", 6, 1, "", methodObject ),
|
||||
new Among ( "ande", 6, 1, "", methodObject ),
|
||||
new Among ( "arne", 6, 1, "", methodObject ),
|
||||
new Among ( "are", 6, 1, "", methodObject ),
|
||||
new Among ( "aste", 6, 1, "", methodObject ),
|
||||
new Among ( "en", -1, 1, "", methodObject ),
|
||||
new Among ( "anden", 12, 1, "", methodObject ),
|
||||
new Among ( "aren", 12, 1, "", methodObject ),
|
||||
new Among ( "heten", 12, 1, "", methodObject ),
|
||||
new Among ( "ern", -1, 1, "", methodObject ),
|
||||
new Among ( "ar", -1, 1, "", methodObject ),
|
||||
new Among ( "er", -1, 1, "", methodObject ),
|
||||
new Among ( "heter", 18, 1, "", methodObject ),
|
||||
new Among ( "or", -1, 1, "", methodObject ),
|
||||
new Among ( "s", -1, 2, "", methodObject ),
|
||||
new Among ( "as", 21, 1, "", methodObject ),
|
||||
new Among ( "arnas", 22, 1, "", methodObject ),
|
||||
new Among ( "ernas", 22, 1, "", methodObject ),
|
||||
new Among ( "ornas", 22, 1, "", methodObject ),
|
||||
new Among ( "es", 21, 1, "", methodObject ),
|
||||
new Among ( "ades", 26, 1, "", methodObject ),
|
||||
new Among ( "andes", 26, 1, "", methodObject ),
|
||||
new Among ( "ens", 21, 1, "", methodObject ),
|
||||
new Among ( "arens", 29, 1, "", methodObject ),
|
||||
new Among ( "hetens", 29, 1, "", methodObject ),
|
||||
new Among ( "erns", 21, 1, "", methodObject ),
|
||||
new Among ( "at", -1, 1, "", methodObject ),
|
||||
new Among ( "andet", -1, 1, "", methodObject ),
|
||||
new Among ( "het", -1, 1, "", methodObject ),
|
||||
new Among ( "ast", -1, 1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "dd", -1, -1, "", this),
|
||||
new Among ( "gd", -1, -1, "", this),
|
||||
new Among ( "nn", -1, -1, "", this),
|
||||
new Among ( "dt", -1, -1, "", this),
|
||||
new Among ( "gt", -1, -1, "", this),
|
||||
new Among ( "kt", -1, -1, "", this),
|
||||
new Among ( "tt", -1, -1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "dd", -1, -1, "", methodObject ),
|
||||
new Among ( "gd", -1, -1, "", methodObject ),
|
||||
new Among ( "nn", -1, -1, "", methodObject ),
|
||||
new Among ( "dt", -1, -1, "", methodObject ),
|
||||
new Among ( "gt", -1, -1, "", methodObject ),
|
||||
new Among ( "kt", -1, -1, "", methodObject ),
|
||||
new Among ( "tt", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ig", -1, 1, "", this),
|
||||
new Among ( "lig", 0, 1, "", this),
|
||||
new Among ( "els", -1, 1, "", this),
|
||||
new Among ( "fullt", -1, 3, "", this),
|
||||
new Among ( "l\u00F6st", -1, 2, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ig", -1, 1, "", methodObject ),
|
||||
new Among ( "lig", 0, 1, "", methodObject ),
|
||||
new Among ( "els", -1, 1, "", methodObject ),
|
||||
new Among ( "fullt", -1, 3, "", methodObject ),
|
||||
new Among ( "l\u00F6st", -1, 2, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_v[] = {17, 65, 16, 1, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 24, 0, 32 };
|
||||
|
@ -345,5 +352,15 @@ public class SwedishStemmer extends SnowballProgram {
|
|||
cursor = limit_backward; return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof SwedishStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return SwedishStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -1,204 +1,211 @@
|
|||
// This file was generated automatically by the Snowball to Java compiler
|
||||
|
||||
package org.tartarus.snowball.ext;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
import org.tartarus.snowball.Among;
|
||||
|
||||
/**
|
||||
* Generated class implementing code defined by a snowball script.
|
||||
import org.tartarus.snowball.Among;
|
||||
import org.tartarus.snowball.SnowballProgram;
|
||||
|
||||
/**
|
||||
* This class was automatically generated by a Snowball to Java compiler
|
||||
* It implements the stemming algorithm defined by a snowball script.
|
||||
*/
|
||||
|
||||
public class TurkishStemmer extends SnowballProgram {
|
||||
|
||||
private Among a_0[] = {
|
||||
new Among ( "m", -1, -1, "", this),
|
||||
new Among ( "n", -1, -1, "", this),
|
||||
new Among ( "miz", -1, -1, "", this),
|
||||
new Among ( "niz", -1, -1, "", this),
|
||||
new Among ( "muz", -1, -1, "", this),
|
||||
new Among ( "nuz", -1, -1, "", this),
|
||||
new Among ( "m\u00FCz", -1, -1, "", this),
|
||||
new Among ( "n\u00FCz", -1, -1, "", this),
|
||||
new Among ( "m\u0131z", -1, -1, "", this),
|
||||
new Among ( "n\u0131z", -1, -1, "", this)
|
||||
private static final long serialVersionUID = 1L;
|
||||
|
||||
private final static TurkishStemmer methodObject = new TurkishStemmer ();
|
||||
|
||||
private final static Among a_0[] = {
|
||||
new Among ( "m", -1, -1, "", methodObject ),
|
||||
new Among ( "n", -1, -1, "", methodObject ),
|
||||
new Among ( "miz", -1, -1, "", methodObject ),
|
||||
new Among ( "niz", -1, -1, "", methodObject ),
|
||||
new Among ( "muz", -1, -1, "", methodObject ),
|
||||
new Among ( "nuz", -1, -1, "", methodObject ),
|
||||
new Among ( "m\u00FCz", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u00FCz", -1, -1, "", methodObject ),
|
||||
new Among ( "m\u0131z", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u0131z", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_1[] = {
|
||||
new Among ( "leri", -1, -1, "", this),
|
||||
new Among ( "lar\u0131", -1, -1, "", this)
|
||||
private final static Among a_1[] = {
|
||||
new Among ( "leri", -1, -1, "", methodObject ),
|
||||
new Among ( "lar\u0131", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_2[] = {
|
||||
new Among ( "ni", -1, -1, "", this),
|
||||
new Among ( "nu", -1, -1, "", this),
|
||||
new Among ( "n\u00FC", -1, -1, "", this),
|
||||
new Among ( "n\u0131", -1, -1, "", this)
|
||||
private final static Among a_2[] = {
|
||||
new Among ( "ni", -1, -1, "", methodObject ),
|
||||
new Among ( "nu", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u00FC", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u0131", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_3[] = {
|
||||
new Among ( "in", -1, -1, "", this),
|
||||
new Among ( "un", -1, -1, "", this),
|
||||
new Among ( "\u00FCn", -1, -1, "", this),
|
||||
new Among ( "\u0131n", -1, -1, "", this)
|
||||
private final static Among a_3[] = {
|
||||
new Among ( "in", -1, -1, "", methodObject ),
|
||||
new Among ( "un", -1, -1, "", methodObject ),
|
||||
new Among ( "\u00FCn", -1, -1, "", methodObject ),
|
||||
new Among ( "\u0131n", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_4[] = {
|
||||
new Among ( "a", -1, -1, "", this),
|
||||
new Among ( "e", -1, -1, "", this)
|
||||
private final static Among a_4[] = {
|
||||
new Among ( "a", -1, -1, "", methodObject ),
|
||||
new Among ( "e", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_5[] = {
|
||||
new Among ( "na", -1, -1, "", this),
|
||||
new Among ( "ne", -1, -1, "", this)
|
||||
private final static Among a_5[] = {
|
||||
new Among ( "na", -1, -1, "", methodObject ),
|
||||
new Among ( "ne", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_6[] = {
|
||||
new Among ( "da", -1, -1, "", this),
|
||||
new Among ( "ta", -1, -1, "", this),
|
||||
new Among ( "de", -1, -1, "", this),
|
||||
new Among ( "te", -1, -1, "", this)
|
||||
private final static Among a_6[] = {
|
||||
new Among ( "da", -1, -1, "", methodObject ),
|
||||
new Among ( "ta", -1, -1, "", methodObject ),
|
||||
new Among ( "de", -1, -1, "", methodObject ),
|
||||
new Among ( "te", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_7[] = {
|
||||
new Among ( "nda", -1, -1, "", this),
|
||||
new Among ( "nde", -1, -1, "", this)
|
||||
private final static Among a_7[] = {
|
||||
new Among ( "nda", -1, -1, "", methodObject ),
|
||||
new Among ( "nde", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_8[] = {
|
||||
new Among ( "dan", -1, -1, "", this),
|
||||
new Among ( "tan", -1, -1, "", this),
|
||||
new Among ( "den", -1, -1, "", this),
|
||||
new Among ( "ten", -1, -1, "", this)
|
||||
private final static Among a_8[] = {
|
||||
new Among ( "dan", -1, -1, "", methodObject ),
|
||||
new Among ( "tan", -1, -1, "", methodObject ),
|
||||
new Among ( "den", -1, -1, "", methodObject ),
|
||||
new Among ( "ten", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_9[] = {
|
||||
new Among ( "ndan", -1, -1, "", this),
|
||||
new Among ( "nden", -1, -1, "", this)
|
||||
private final static Among a_9[] = {
|
||||
new Among ( "ndan", -1, -1, "", methodObject ),
|
||||
new Among ( "nden", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_10[] = {
|
||||
new Among ( "la", -1, -1, "", this),
|
||||
new Among ( "le", -1, -1, "", this)
|
||||
private final static Among a_10[] = {
|
||||
new Among ( "la", -1, -1, "", methodObject ),
|
||||
new Among ( "le", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_11[] = {
|
||||
new Among ( "ca", -1, -1, "", this),
|
||||
new Among ( "ce", -1, -1, "", this)
|
||||
private final static Among a_11[] = {
|
||||
new Among ( "ca", -1, -1, "", methodObject ),
|
||||
new Among ( "ce", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_12[] = {
|
||||
new Among ( "im", -1, -1, "", this),
|
||||
new Among ( "um", -1, -1, "", this),
|
||||
new Among ( "\u00FCm", -1, -1, "", this),
|
||||
new Among ( "\u0131m", -1, -1, "", this)
|
||||
private final static Among a_12[] = {
|
||||
new Among ( "im", -1, -1, "", methodObject ),
|
||||
new Among ( "um", -1, -1, "", methodObject ),
|
||||
new Among ( "\u00FCm", -1, -1, "", methodObject ),
|
||||
new Among ( "\u0131m", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_13[] = {
|
||||
new Among ( "sin", -1, -1, "", this),
|
||||
new Among ( "sun", -1, -1, "", this),
|
||||
new Among ( "s\u00FCn", -1, -1, "", this),
|
||||
new Among ( "s\u0131n", -1, -1, "", this)
|
||||
private final static Among a_13[] = {
|
||||
new Among ( "sin", -1, -1, "", methodObject ),
|
||||
new Among ( "sun", -1, -1, "", methodObject ),
|
||||
new Among ( "s\u00FCn", -1, -1, "", methodObject ),
|
||||
new Among ( "s\u0131n", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_14[] = {
|
||||
new Among ( "iz", -1, -1, "", this),
|
||||
new Among ( "uz", -1, -1, "", this),
|
||||
new Among ( "\u00FCz", -1, -1, "", this),
|
||||
new Among ( "\u0131z", -1, -1, "", this)
|
||||
private final static Among a_14[] = {
|
||||
new Among ( "iz", -1, -1, "", methodObject ),
|
||||
new Among ( "uz", -1, -1, "", methodObject ),
|
||||
new Among ( "\u00FCz", -1, -1, "", methodObject ),
|
||||
new Among ( "\u0131z", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_15[] = {
|
||||
new Among ( "siniz", -1, -1, "", this),
|
||||
new Among ( "sunuz", -1, -1, "", this),
|
||||
new Among ( "s\u00FCn\u00FCz", -1, -1, "", this),
|
||||
new Among ( "s\u0131n\u0131z", -1, -1, "", this)
|
||||
private final static Among a_15[] = {
|
||||
new Among ( "siniz", -1, -1, "", methodObject ),
|
||||
new Among ( "sunuz", -1, -1, "", methodObject ),
|
||||
new Among ( "s\u00FCn\u00FCz", -1, -1, "", methodObject ),
|
||||
new Among ( "s\u0131n\u0131z", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_16[] = {
|
||||
new Among ( "lar", -1, -1, "", this),
|
||||
new Among ( "ler", -1, -1, "", this)
|
||||
private final static Among a_16[] = {
|
||||
new Among ( "lar", -1, -1, "", methodObject ),
|
||||
new Among ( "ler", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_17[] = {
|
||||
new Among ( "niz", -1, -1, "", this),
|
||||
new Among ( "nuz", -1, -1, "", this),
|
||||
new Among ( "n\u00FCz", -1, -1, "", this),
|
||||
new Among ( "n\u0131z", -1, -1, "", this)
|
||||
private final static Among a_17[] = {
|
||||
new Among ( "niz", -1, -1, "", methodObject ),
|
||||
new Among ( "nuz", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u00FCz", -1, -1, "", methodObject ),
|
||||
new Among ( "n\u0131z", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_18[] = {
|
||||
new Among ( "dir", -1, -1, "", this),
|
||||
new Among ( "tir", -1, -1, "", this),
|
||||
new Among ( "dur", -1, -1, "", this),
|
||||
new Among ( "tur", -1, -1, "", this),
|
||||
new Among ( "d\u00FCr", -1, -1, "", this),
|
||||
new Among ( "t\u00FCr", -1, -1, "", this),
|
||||
new Among ( "d\u0131r", -1, -1, "", this),
|
||||
new Among ( "t\u0131r", -1, -1, "", this)
|
||||
private final static Among a_18[] = {
|
||||
new Among ( "dir", -1, -1, "", methodObject ),
|
||||
new Among ( "tir", -1, -1, "", methodObject ),
|
||||
new Among ( "dur", -1, -1, "", methodObject ),
|
||||
new Among ( "tur", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u00FCr", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00FCr", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u0131r", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u0131r", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_19[] = {
|
||||
new Among ( "cas\u0131na", -1, -1, "", this),
|
||||
new Among ( "cesine", -1, -1, "", this)
|
||||
private final static Among a_19[] = {
|
||||
new Among ( "cas\u0131na", -1, -1, "", methodObject ),
|
||||
new Among ( "cesine", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_20[] = {
|
||||
new Among ( "di", -1, -1, "", this),
|
||||
new Among ( "ti", -1, -1, "", this),
|
||||
new Among ( "dik", -1, -1, "", this),
|
||||
new Among ( "tik", -1, -1, "", this),
|
||||
new Among ( "duk", -1, -1, "", this),
|
||||
new Among ( "tuk", -1, -1, "", this),
|
||||
new Among ( "d\u00FCk", -1, -1, "", this),
|
||||
new Among ( "t\u00FCk", -1, -1, "", this),
|
||||
new Among ( "d\u0131k", -1, -1, "", this),
|
||||
new Among ( "t\u0131k", -1, -1, "", this),
|
||||
new Among ( "dim", -1, -1, "", this),
|
||||
new Among ( "tim", -1, -1, "", this),
|
||||
new Among ( "dum", -1, -1, "", this),
|
||||
new Among ( "tum", -1, -1, "", this),
|
||||
new Among ( "d\u00FCm", -1, -1, "", this),
|
||||
new Among ( "t\u00FCm", -1, -1, "", this),
|
||||
new Among ( "d\u0131m", -1, -1, "", this),
|
||||
new Among ( "t\u0131m", -1, -1, "", this),
|
||||
new Among ( "din", -1, -1, "", this),
|
||||
new Among ( "tin", -1, -1, "", this),
|
||||
new Among ( "dun", -1, -1, "", this),
|
||||
new Among ( "tun", -1, -1, "", this),
|
||||
new Among ( "d\u00FCn", -1, -1, "", this),
|
||||
new Among ( "t\u00FCn", -1, -1, "", this),
|
||||
new Among ( "d\u0131n", -1, -1, "", this),
|
||||
new Among ( "t\u0131n", -1, -1, "", this),
|
||||
new Among ( "du", -1, -1, "", this),
|
||||
new Among ( "tu", -1, -1, "", this),
|
||||
new Among ( "d\u00FC", -1, -1, "", this),
|
||||
new Among ( "t\u00FC", -1, -1, "", this),
|
||||
new Among ( "d\u0131", -1, -1, "", this),
|
||||
new Among ( "t\u0131", -1, -1, "", this)
|
||||
private final static Among a_20[] = {
|
||||
new Among ( "di", -1, -1, "", methodObject ),
|
||||
new Among ( "ti", -1, -1, "", methodObject ),
|
||||
new Among ( "dik", -1, -1, "", methodObject ),
|
||||
new Among ( "tik", -1, -1, "", methodObject ),
|
||||
new Among ( "duk", -1, -1, "", methodObject ),
|
||||
new Among ( "tuk", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u00FCk", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00FCk", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u0131k", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u0131k", -1, -1, "", methodObject ),
|
||||
new Among ( "dim", -1, -1, "", methodObject ),
|
||||
new Among ( "tim", -1, -1, "", methodObject ),
|
||||
new Among ( "dum", -1, -1, "", methodObject ),
|
||||
new Among ( "tum", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u00FCm", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00FCm", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u0131m", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u0131m", -1, -1, "", methodObject ),
|
||||
new Among ( "din", -1, -1, "", methodObject ),
|
||||
new Among ( "tin", -1, -1, "", methodObject ),
|
||||
new Among ( "dun", -1, -1, "", methodObject ),
|
||||
new Among ( "tun", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u00FCn", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00FCn", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u0131n", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u0131n", -1, -1, "", methodObject ),
|
||||
new Among ( "du", -1, -1, "", methodObject ),
|
||||
new Among ( "tu", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u00FC", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u00FC", -1, -1, "", methodObject ),
|
||||
new Among ( "d\u0131", -1, -1, "", methodObject ),
|
||||
new Among ( "t\u0131", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_21[] = {
|
||||
new Among ( "sa", -1, -1, "", this),
|
||||
new Among ( "se", -1, -1, "", this),
|
||||
new Among ( "sak", -1, -1, "", this),
|
||||
new Among ( "sek", -1, -1, "", this),
|
||||
new Among ( "sam", -1, -1, "", this),
|
||||
new Among ( "sem", -1, -1, "", this),
|
||||
new Among ( "san", -1, -1, "", this),
|
||||
new Among ( "sen", -1, -1, "", this)
|
||||
private final static Among a_21[] = {
|
||||
new Among ( "sa", -1, -1, "", methodObject ),
|
||||
new Among ( "se", -1, -1, "", methodObject ),
|
||||
new Among ( "sak", -1, -1, "", methodObject ),
|
||||
new Among ( "sek", -1, -1, "", methodObject ),
|
||||
new Among ( "sam", -1, -1, "", methodObject ),
|
||||
new Among ( "sem", -1, -1, "", methodObject ),
|
||||
new Among ( "san", -1, -1, "", methodObject ),
|
||||
new Among ( "sen", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_22[] = {
|
||||
new Among ( "mi\u015F", -1, -1, "", this),
|
||||
new Among ( "mu\u015F", -1, -1, "", this),
|
||||
new Among ( "m\u00FC\u015F", -1, -1, "", this),
|
||||
new Among ( "m\u0131\u015F", -1, -1, "", this)
|
||||
private final static Among a_22[] = {
|
||||
new Among ( "mi\u015F", -1, -1, "", methodObject ),
|
||||
new Among ( "mu\u015F", -1, -1, "", methodObject ),
|
||||
new Among ( "m\u00FC\u015F", -1, -1, "", methodObject ),
|
||||
new Among ( "m\u0131\u015F", -1, -1, "", methodObject )
|
||||
};
|
||||
|
||||
private Among a_23[] = {
|
||||
new Among ( "b", -1, 1, "", this),
|
||||
new Among ( "c", -1, 2, "", this),
|
||||
new Among ( "d", -1, 3, "", this),
|
||||
new Among ( "\u011F", -1, 4, "", this)
|
||||
private final static Among a_23[] = {
|
||||
new Among ( "b", -1, 1, "", methodObject ),
|
||||
new Among ( "c", -1, 2, "", methodObject ),
|
||||
new Among ( "d", -1, 3, "", methodObject ),
|
||||
new Among ( "\u011F", -1, 4, "", methodObject )
|
||||
};
|
||||
|
||||
private static final char g_vowel[] = {17, 65, 16, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 32, 8, 0, 0, 0, 0, 0, 0, 1 };
|
||||
|
@ -3126,5 +3133,15 @@ public class TurkishStemmer extends SnowballProgram {
|
|||
return true;
|
||||
}
|
||||
|
||||
public boolean equals( Object o ) {
|
||||
return o instanceof TurkishStemmer;
|
||||
}
|
||||
|
||||
public int hashCode() {
|
||||
return TurkishStemmer.class.getName().hashCode();
|
||||
}
|
||||
|
||||
|
||||
|
||||
}
|
||||
|
||||
|
|
|
@ -40,7 +40,6 @@ org.apache.lucene.analysis.en.PorterStemFilterFactory
|
|||
org.apache.lucene.analysis.es.SpanishLightStemFilterFactory
|
||||
org.apache.lucene.analysis.fa.PersianNormalizationFilterFactory
|
||||
org.apache.lucene.analysis.fi.FinnishLightStemFilterFactory
|
||||
org.apache.lucene.analysis.fr.ElisionFilterFactory
|
||||
org.apache.lucene.analysis.fr.FrenchLightStemFilterFactory
|
||||
org.apache.lucene.analysis.fr.FrenchMinimalStemFilterFactory
|
||||
org.apache.lucene.analysis.ga.IrishLowerCaseFilterFactory
|
||||
|
@ -88,3 +87,4 @@ org.apache.lucene.analysis.sv.SwedishLightStemFilterFactory
|
|||
org.apache.lucene.analysis.synonym.SynonymFilterFactory
|
||||
org.apache.lucene.analysis.th.ThaiWordFilterFactory
|
||||
org.apache.lucene.analysis.tr.TurkishLowerCaseFilterFactory
|
||||
org.apache.lucene.analysis.util.ElisionFilterFactory
|
||||
|
|
|
@ -18,6 +18,7 @@ package org.apache.lucene.analysis.cjk;
|
|||
*/
|
||||
|
||||
import java.io.Reader;
|
||||
import java.util.Random;
|
||||
|
||||
import org.apache.lucene.analysis.Analyzer;
|
||||
import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
||||
|
@ -33,6 +34,15 @@ public class TestCJKBigramFilter extends BaseTokenStreamTestCase {
|
|||
}
|
||||
};
|
||||
|
||||
Analyzer unibiAnalyzer = new Analyzer() {
|
||||
@Override
|
||||
protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
|
||||
Tokenizer t = new StandardTokenizer(TEST_VERSION_CURRENT, reader);
|
||||
return new TokenStreamComponents(t,
|
||||
new CJKBigramFilter(t, 0xff, true));
|
||||
}
|
||||
};
|
||||
|
||||
public void testHuge() throws Exception {
|
||||
assertAnalyzesTo(analyzer, "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた"
|
||||
+ "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた"
|
||||
|
@ -62,6 +72,96 @@ public class TestCJKBigramFilter extends BaseTokenStreamTestCase {
|
|||
}
|
||||
};
|
||||
assertAnalyzesTo(a, "多くの学生が試験に落ちた。",
|
||||
new String[] { "多", "く", "の", "学生", "が", "試験", "に", "落", "ち", "た" });
|
||||
new String[] { "多", "く", "の", "学生", "が", "試験", "に", "落", "ち", "た" },
|
||||
new int[] { 0, 1, 2, 3, 5, 6, 8, 9, 10, 11 },
|
||||
new int[] { 1, 2, 3, 5, 6, 8, 9, 10, 11, 12 },
|
||||
new String[] { "<SINGLE>", "<HIRAGANA>", "<HIRAGANA>", "<DOUBLE>", "<HIRAGANA>", "<DOUBLE>",
|
||||
"<HIRAGANA>", "<SINGLE>", "<HIRAGANA>", "<HIRAGANA>", "<SINGLE>" },
|
||||
new int[] { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 },
|
||||
new int[] { 1, 1, 1, 1, 1, 1, 1, 1, 1, 1 });
|
||||
}
|
||||
|
||||
public void testAllScripts() throws Exception {
|
||||
Analyzer a = new Analyzer() {
|
||||
@Override
|
||||
protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
|
||||
Tokenizer t = new StandardTokenizer(TEST_VERSION_CURRENT, reader);
|
||||
return new TokenStreamComponents(t,
|
||||
new CJKBigramFilter(t, 0xff, false));
|
||||
}
|
||||
};
|
||||
assertAnalyzesTo(a, "多くの学生が試験に落ちた。",
|
||||
new String[] { "多く", "くの", "の学", "学生", "生が", "が試", "試験", "験に", "に落", "落ち", "ちた" });
|
||||
}
|
||||
|
||||
public void testUnigramsAndBigramsAllScripts() throws Exception {
|
||||
assertAnalyzesTo(unibiAnalyzer, "多くの学生が試験に落ちた。",
|
||||
new String[] {
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生",
|
||||
"生が", "が", "が試", "試", "試験", "験", "験に", "に",
|
||||
"に落", "落", "落ち", "ち", "ちた", "た"
|
||||
},
|
||||
new int[] { 0, 0, 1, 1, 2, 2, 3, 3, 4, 4, 5, 5, 6,
|
||||
6, 7, 7, 8, 8, 9, 9, 10, 10, 11 },
|
||||
new int[] { 1, 2, 2, 3, 3, 4, 4, 5, 5, 6, 6, 7, 7,
|
||||
8, 8, 9, 9, 10, 10, 11, 11, 12, 12 },
|
||||
new String[] { "<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>",
|
||||
"<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>",
|
||||
"<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>", "<SINGLE>", "<DOUBLE>", "<SINGLE>" },
|
||||
new int[] { 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1, 0, 1,
|
||||
0, 1, 0, 1, 0, 1, 0, 1, 0, 1 },
|
||||
new int[] { 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1, 2, 1,
|
||||
2, 1, 2, 1, 2, 1, 2, 1, 2, 1 }
|
||||
);
|
||||
}
|
||||
|
||||
public void testUnigramsAndBigramsHanOnly() throws Exception {
|
||||
Analyzer a = new Analyzer() {
|
||||
@Override
|
||||
protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
|
||||
Tokenizer t = new StandardTokenizer(TEST_VERSION_CURRENT, reader);
|
||||
return new TokenStreamComponents(t, new CJKBigramFilter(t, CJKBigramFilter.HAN, true));
|
||||
}
|
||||
};
|
||||
assertAnalyzesTo(a, "多くの学生が試験に落ちた。",
|
||||
new String[] { "多", "く", "の", "学", "学生", "生", "が", "試", "試験", "験", "に", "落", "ち", "た" },
|
||||
new int[] { 0, 1, 2, 3, 3, 4, 5, 6, 6, 7, 8, 9, 10, 11 },
|
||||
new int[] { 1, 2, 3, 4, 5, 5, 6, 7, 8, 8, 9, 10, 11, 12 },
|
||||
new String[] { "<SINGLE>", "<HIRAGANA>", "<HIRAGANA>", "<SINGLE>", "<DOUBLE>",
|
||||
"<SINGLE>", "<HIRAGANA>", "<SINGLE>", "<DOUBLE>", "<SINGLE>",
|
||||
"<HIRAGANA>", "<SINGLE>", "<HIRAGANA>", "<HIRAGANA>", "<SINGLE>" },
|
||||
new int[] { 1, 1, 1, 1, 0, 1, 1, 1, 0, 1, 1, 1, 1, 1 },
|
||||
new int[] { 1, 1, 1, 1, 2, 1, 1, 1, 2, 1, 1, 1, 1, 1 });
|
||||
}
|
||||
|
||||
public void testUnigramsAndBigramsHuge() throws Exception {
|
||||
assertAnalyzesTo(unibiAnalyzer, "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた"
|
||||
+ "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた"
|
||||
+ "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた" + "多くの学生が試験に落ちた",
|
||||
new String[] {
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た", "た多",
|
||||
"多", "多く", "く", "くの", "の", "の学", "学", "学生", "生", "生が", "が", "が試", "試", "試験", "験", "験に", "に", "に落", "落", "落ち", "ち", "ちた", "た"
|
||||
}
|
||||
);
|
||||
}
|
||||
|
||||
/** blast some random strings through the analyzer */
|
||||
public void testRandomUnibiStrings() throws Exception {
|
||||
checkRandomData(random(), unibiAnalyzer, 1000*RANDOM_MULTIPLIER);
|
||||
}
|
||||
|
||||
/** blast some random strings through the analyzer */
|
||||
public void testRandomUnibiHugeStrings() throws Exception {
|
||||
Random random = random();
|
||||
checkRandomData(random, unibiAnalyzer, 100*RANDOM_MULTIPLIER, 8192);
|
||||
}
|
||||
}
|
||||
|
|
|
@ -52,4 +52,16 @@ public class TestCJKBigramFilterFactory extends BaseTokenStreamTestCase {
|
|||
assertTokenStreamContents(stream,
|
||||
new String[] { "多", "く", "の", "学生", "が", "試験", "に", "落", "ち", "た" });
|
||||
}
|
||||
|
||||
public void testHanOnlyUnigrams() throws Exception {
|
||||
Reader reader = new StringReader("多くの学生が試験に落ちた。");
|
||||
CJKBigramFilterFactory factory = new CJKBigramFilterFactory();
|
||||
Map<String,String> args = new HashMap<String,String>();
|
||||
args.put("hiragana", "false");
|
||||
args.put("outputUnigrams", "true");
|
||||
factory.init(args);
|
||||
TokenStream stream = factory.create(new StandardTokenizer(TEST_VERSION_CURRENT, reader));
|
||||
assertTokenStreamContents(stream,
|
||||
new String[] { "多", "く", "の", "学", "学生", "生", "が", "試", "試験", "験", "に", "落", "ち", "た" });
|
||||
}
|
||||
}
|
||||
|
|
|
@ -23,7 +23,7 @@ import org.apache.lucene.analysis.TokenStream;
|
|||
import org.apache.lucene.analysis.Tokenizer;
|
||||
import org.apache.lucene.analysis.core.TestStopFilter;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
|
||||
import java.io.StringReader;
|
||||
|
@ -39,7 +39,7 @@ import java.util.HashMap;
|
|||
public class TestCommonGramsFilterFactory extends BaseTokenStreamTestCase {
|
||||
|
||||
public void testInform() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(TestStopFilter.class);
|
||||
ResourceLoader loader = new ClasspathResourceLoader(TestStopFilter.class);
|
||||
assertTrue("loader is null and it shouldn't be", loader != null);
|
||||
CommonGramsFilterFactory factory = new CommonGramsFilterFactory();
|
||||
Map<String, String> args = new HashMap<String, String>();
|
||||
|
@ -89,7 +89,7 @@ public class TestCommonGramsFilterFactory extends BaseTokenStreamTestCase {
|
|||
* If no words are provided, then a set of english default stopwords is used.
|
||||
*/
|
||||
public void testDefaults() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(TestStopFilter.class);
|
||||
ResourceLoader loader = new ClasspathResourceLoader(TestStopFilter.class);
|
||||
assertTrue("loader is null and it shouldn't be", loader != null);
|
||||
CommonGramsFilterFactory factory = new CommonGramsFilterFactory();
|
||||
factory.setLuceneMatchVersion(TEST_VERSION_CURRENT);
|
||||
|
|
|
@ -23,7 +23,7 @@ import org.apache.lucene.analysis.TokenStream;
|
|||
import org.apache.lucene.analysis.Tokenizer;
|
||||
import org.apache.lucene.analysis.core.TestStopFilter;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
|
||||
import java.io.StringReader;
|
||||
|
@ -39,7 +39,7 @@ import java.util.HashMap;
|
|||
public class TestCommonGramsQueryFilterFactory extends BaseTokenStreamTestCase {
|
||||
|
||||
public void testInform() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(TestStopFilter.class);
|
||||
ResourceLoader loader = new ClasspathResourceLoader(TestStopFilter.class);
|
||||
assertTrue("loader is null and it shouldn't be", loader != null);
|
||||
CommonGramsQueryFilterFactory factory = new CommonGramsQueryFilterFactory();
|
||||
Map<String, String> args = new HashMap<String, String>();
|
||||
|
@ -89,7 +89,7 @@ public class TestCommonGramsQueryFilterFactory extends BaseTokenStreamTestCase {
|
|||
* If no words are provided, then a set of english default stopwords is used.
|
||||
*/
|
||||
public void testDefaults() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(TestStopFilter.class);
|
||||
ResourceLoader loader = new ClasspathResourceLoader(TestStopFilter.class);
|
||||
assertTrue("loader is null and it shouldn't be", loader != null);
|
||||
CommonGramsQueryFilterFactory factory = new CommonGramsQueryFilterFactory();
|
||||
factory.setLuceneMatchVersion(TEST_VERSION_CURRENT);
|
||||
|
|
|
@ -26,7 +26,7 @@ import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
|||
import org.apache.lucene.analysis.MockTokenizer;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.Tokenizer;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
|
||||
/**
|
||||
|
@ -40,7 +40,7 @@ public class TestDictionaryCompoundWordTokenFilterFactory extends BaseTokenStrea
|
|||
Reader reader = new StringReader("I like to play softball");
|
||||
Tokenizer tokenizer = new MockTokenizer(reader, MockTokenizer.WHITESPACE, false);
|
||||
DictionaryCompoundWordTokenFilterFactory factory = new DictionaryCompoundWordTokenFilterFactory();
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(getClass());
|
||||
ResourceLoader loader = new ClasspathResourceLoader(getClass());
|
||||
Map<String,String> args = new HashMap<String,String>();
|
||||
args.put("dictionary", "compoundDictionary.txt");
|
||||
factory.setLuceneMatchVersion(TEST_VERSION_CURRENT);
|
||||
|
|
|
@ -26,7 +26,7 @@ import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
|||
import org.apache.lucene.analysis.MockTokenizer;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.Tokenizer;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
|
||||
/**
|
||||
|
@ -40,7 +40,7 @@ public class TestHyphenationCompoundWordTokenFilterFactory extends BaseTokenStre
|
|||
Reader reader = new StringReader("min veninde som er lidt af en læsehest");
|
||||
Tokenizer tokenizer = new MockTokenizer(reader, MockTokenizer.WHITESPACE, false);
|
||||
HyphenationCompoundWordTokenFilterFactory factory = new HyphenationCompoundWordTokenFilterFactory();
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(getClass());
|
||||
ResourceLoader loader = new ClasspathResourceLoader(getClass());
|
||||
Map<String,String> args = new HashMap<String,String>();
|
||||
args.put("hyphenator", "da_UTF8.xml");
|
||||
args.put("dictionary", "da_compoundDictionary.txt");
|
||||
|
@ -64,7 +64,7 @@ public class TestHyphenationCompoundWordTokenFilterFactory extends BaseTokenStre
|
|||
Reader reader = new StringReader("basketballkurv");
|
||||
Tokenizer tokenizer = new MockTokenizer(reader, MockTokenizer.WHITESPACE, false);
|
||||
HyphenationCompoundWordTokenFilterFactory factory = new HyphenationCompoundWordTokenFilterFactory();
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(getClass());
|
||||
ResourceLoader loader = new ClasspathResourceLoader(getClass());
|
||||
Map<String,String> args = new HashMap<String,String>();
|
||||
args.put("hyphenator", "da_UTF8.xml");
|
||||
args.put("minSubwordSize", "2");
|
||||
|
|
|
@ -285,8 +285,7 @@ public class TestClassicAnalyzer extends BaseTokenStreamTestCase {
|
|||
DocsAndPositionsEnum tps = MultiFields.getTermPositionsEnum(reader,
|
||||
MultiFields.getLiveDocs(reader),
|
||||
"content",
|
||||
new BytesRef("another"),
|
||||
false);
|
||||
new BytesRef("another"));
|
||||
assertTrue(tps.nextDoc() != DocIdSetIterator.NO_MORE_DOCS);
|
||||
assertEquals(1, tps.freq());
|
||||
assertEquals(3, tps.nextPosition());
|
||||
|
|
|
@ -103,7 +103,7 @@ public class TestKeywordAnalyzer extends BaseTokenStreamTestCase {
|
|||
new BytesRef("Q36"),
|
||||
MultiFields.getLiveDocs(reader),
|
||||
null,
|
||||
false);
|
||||
0);
|
||||
assertTrue(td.nextDoc() != DocIdSetIterator.NO_MORE_DOCS);
|
||||
td = _TestUtil.docs(random(),
|
||||
reader,
|
||||
|
@ -111,7 +111,7 @@ public class TestKeywordAnalyzer extends BaseTokenStreamTestCase {
|
|||
new BytesRef("Q37"),
|
||||
MultiFields.getLiveDocs(reader),
|
||||
null,
|
||||
false);
|
||||
0);
|
||||
assertTrue(td.nextDoc() != DocIdSetIterator.NO_MORE_DOCS);
|
||||
}
|
||||
|
||||
|
|
|
@ -19,7 +19,7 @@ package org.apache.lucene.analysis.core;
|
|||
|
||||
import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
|
||||
import java.util.Map;
|
||||
|
@ -32,7 +32,7 @@ import java.util.HashMap;
|
|||
public class TestStopFilterFactory extends BaseTokenStreamTestCase {
|
||||
|
||||
public void testInform() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(getClass());
|
||||
ResourceLoader loader = new ClasspathResourceLoader(getClass());
|
||||
assertTrue("loader is null and it shouldn't be", loader != null);
|
||||
StopFilterFactory factory = new StopFilterFactory();
|
||||
Map<String, String> args = new HashMap<String, String>();
|
||||
|
|
|
@ -19,7 +19,7 @@ package org.apache.lucene.analysis.core;
|
|||
|
||||
import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
||||
import org.apache.lucene.analysis.NumericTokenStream;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
import org.junit.Test;
|
||||
|
||||
|
@ -34,7 +34,7 @@ public class TestTypeTokenFilterFactory extends BaseTokenStreamTestCase {
|
|||
|
||||
@Test
|
||||
public void testInform() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(getClass());
|
||||
ResourceLoader loader = new ClasspathResourceLoader(getClass());
|
||||
TypeTokenFilterFactory factory = new TypeTokenFilterFactory();
|
||||
Map<String, String> args = new HashMap<String, String>();
|
||||
args.put("types", "stoptypes-1.txt");
|
||||
|
@ -94,7 +94,7 @@ public class TestTypeTokenFilterFactory extends BaseTokenStreamTestCase {
|
|||
args.put("enablePositionIncrements", "false");
|
||||
typeTokenFilterFactory.setLuceneMatchVersion(TEST_VERSION_CURRENT);
|
||||
typeTokenFilterFactory.init(args);
|
||||
typeTokenFilterFactory.inform(new ResourceAsStreamResourceLoader(getClass()));
|
||||
typeTokenFilterFactory.inform(new ClasspathResourceLoader(getClass()));
|
||||
fail("not supplying 'types' parameter should cause an IllegalArgumentException");
|
||||
} catch (IllegalArgumentException e) {
|
||||
// everything ok
|
||||
|
|
|
@ -25,7 +25,7 @@ import java.util.Map;
|
|||
import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
||||
import org.apache.lucene.analysis.MockTokenizer;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
|
||||
/**
|
||||
* Simple tests to ensure the Hunspell stemmer loads from factory
|
||||
|
@ -38,7 +38,7 @@ public class TestHunspellStemFilterFactory extends BaseTokenStreamTestCase {
|
|||
args.put("affix", "test.aff");
|
||||
factory.setLuceneMatchVersion(TEST_VERSION_CURRENT);
|
||||
factory.init(args);
|
||||
factory.inform(new ResourceAsStreamResourceLoader(getClass()));
|
||||
factory.inform(new ClasspathResourceLoader(getClass()));
|
||||
|
||||
Reader reader = new StringReader("abc");
|
||||
TokenStream stream = factory.create(new MockTokenizer(reader, MockTokenizer.WHITESPACE, false));
|
||||
|
|
|
@ -19,7 +19,7 @@ package org.apache.lucene.analysis.miscellaneous;
|
|||
|
||||
import org.apache.lucene.analysis.BaseTokenStreamTestCase;
|
||||
import org.apache.lucene.analysis.util.CharArraySet;
|
||||
import org.apache.lucene.analysis.util.ResourceAsStreamResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ClasspathResourceLoader;
|
||||
import org.apache.lucene.analysis.util.ResourceLoader;
|
||||
|
||||
import java.util.Map;
|
||||
|
@ -32,7 +32,7 @@ import java.util.HashMap;
|
|||
public class TestKeepFilterFactory extends BaseTokenStreamTestCase {
|
||||
|
||||
public void testInform() throws Exception {
|
||||
ResourceLoader loader = new ResourceAsStreamResourceLoader(getClass());
|
||||
ResourceLoader loader = new ClasspathResourceLoader(getClass());
|
||||
assertTrue("loader is null and it shouldn't be", loader != null);
|
||||
KeepWordFilterFactory factory = new KeepWordFilterFactory();
|
||||
Map<String, String> args = new HashMap<String, String>();
|
||||
|
|
|
@ -111,7 +111,7 @@ public class TestTeeSinkTokenFilter extends BaseTokenStreamTestCase {
|
|||
TermsEnum termsEnum = vector.iterator(null);
|
||||
termsEnum.next();
|
||||
assertEquals(2, termsEnum.totalTermFreq());
|
||||
DocsAndPositionsEnum positions = termsEnum.docsAndPositions(null, null, true);
|
||||
DocsAndPositionsEnum positions = termsEnum.docsAndPositions(null, null);
|
||||
assertTrue(positions.nextDoc() != DocIdSetIterator.NO_MORE_DOCS);
|
||||
assertEquals(2, positions.freq());
|
||||
positions.nextPosition();
|
||||
|
|
|
@ -25,6 +25,7 @@ import org.apache.lucene.analysis.Analyzer;
|
|||
import org.apache.lucene.analysis.MockTokenizer;
|
||||
import org.apache.lucene.analysis.Tokenizer;
|
||||
import org.apache.lucene.analysis.TokenStream;
|
||||
import org.apache.lucene.analysis.Analyzer.TokenStreamComponents;
|
||||
import org.apache.lucene.analysis.core.KeywordTokenizer;
|
||||
import org.apache.lucene.analysis.standard.StandardAnalyzer;
|
||||
import org.apache.lucene.analysis.tokenattributes.CharTermAttribute;
|
||||
|
@ -116,4 +117,21 @@ public class TestSnowball extends BaseTokenStreamTestCase {
|
|||
checkOneTermReuse(a, "", "");
|
||||
}
|
||||
}
|
||||
|
||||
public void testRandomStrings() throws IOException {
|
||||
for (String lang : SNOWBALL_LANGS) {
|
||||
checkRandomStrings(lang);
|
||||
}
|
||||
}
|
||||
|
||||
public void checkRandomStrings(final String snowballLanguage) throws IOException {
|
||||
Analyzer a = new Analyzer() {
|
||||
@Override
|
||||
protected TokenStreamComponents createComponents(String fieldName, Reader reader) {
|
||||
Tokenizer t = new MockTokenizer(reader);
|
||||
return new TokenStreamComponents(t, new SnowballFilter(t, snowballLanguage));
|
||||
}
|
||||
};
|
||||
checkRandomData(random(), a, 1000*RANDOM_MULTIPLIER);
|
||||
}
|
||||
}
|
Some files were not shown because too many files have changed in this diff Show More
Loading…
Reference in New Issue