mirror of https://github.com/apache/lucene.git
143 lines
5.4 KiB
XML
143 lines
5.4 KiB
XML
<?xml version="1.0"?>
|
|
|
|
<!--
|
|
Licensed to the Apache Software Foundation (ASF) under one or more
|
|
contributor license agreements. See the NOTICE file distributed with
|
|
this work for additional information regarding copyright ownership.
|
|
The ASF licenses this file to You under the Apache License, Version 2.0
|
|
the "License"); you may not use this file except in compliance with
|
|
the License. You may obtain a copy of the License at
|
|
|
|
http://www.apache.org/licenses/LICENSE-2.0
|
|
|
|
Unless required by applicable law or agreed to in writing, software
|
|
distributed under the License is distributed on an "AS IS" BASIS,
|
|
WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
See the License for the specific language governing permissions and
|
|
limitations under the License.
|
|
-->
|
|
|
|
<project name="analyzers-kuromoji" default="default">
|
|
|
|
<description>
|
|
Kuromoji Japanese Morphological Analyzer
|
|
</description>
|
|
|
|
<property name="build.dir" location="../build/kuromoji" />
|
|
<property name="dist.dir" location="../dist/kuromoji" />
|
|
|
|
<!-- default configuration: uses mecab-ipadic -->
|
|
<property name="ipadic.version" value="mecab-ipadic-2.7.0-20070801" />
|
|
<property name="dict.src.file" value="${ipadic.version}.tar.gz" />
|
|
<property name="dict.url" value="http://mecab.googlecode.com/files/${dict.src.file}"/>
|
|
|
|
<!-- alternative configuration: uses mecab-naist-jdic
|
|
<property name="ipadic.version" value="mecab-naist-jdic-0.6.3b-20111013" />
|
|
<property name="dict.src.file" value="${ipadic.version}.tar.gz" />
|
|
<property name="dict.url" value="http://sourceforge.jp/frs/redir.php?m=iij&f=/naist-jdic/53500/${dict.src.file}"/>
|
|
-->
|
|
|
|
<property name="dict.src.dir" value="${build.dir}/${ipadic.version}" />
|
|
<property name="dict.encoding" value="euc-jp"/>
|
|
<property name="dict.format" value="ipadic"/>
|
|
<property name="dict.normalize" value="false"/>
|
|
<property name="dict.target.dir" location="./src/resources"/>
|
|
|
|
<!-- currently whether rat detects this as binary or not
|
|
is platform dependent?! -->
|
|
<property name="rat.excludes" value="**/*.txt,**/bocchan.utf-8"/>
|
|
<import file="../../../lucene/module-build.xml"/>
|
|
|
|
<available type="dir" file="${build.dir}/${ipadic.version}" property="dict.available"/>
|
|
|
|
<path id="classpath">
|
|
<pathelement path="${analyzers-common.jar}"/>
|
|
<path refid="base.classpath"/>
|
|
</path>
|
|
|
|
<target name="compile-core" depends="jar-analyzers-common, common.compile-core" />
|
|
<target name="download-dict" unless="dict.available">
|
|
<get src="${dict.url}" dest="${build.dir}/${dict.src.file}"/>
|
|
<gunzip src="${build.dir}/${dict.src.file}"/>
|
|
<untar src="${build.dir}/${ipadic.version}.tar" dest="${build.dir}"/>
|
|
</target>
|
|
|
|
<path id="tools.dependencies">
|
|
<fileset dir="../icu/lib" includes="icu4j-4.8.1.1.jar"/>
|
|
</path>
|
|
|
|
<path id="tools.classpath">
|
|
<path refid="classpath"/>
|
|
<path refid="tools.dependencies"/>
|
|
<pathelement location="${build.dir}/classes/java"/>
|
|
<pathelement location="${build.dir}/classes/tools"/>
|
|
</path>
|
|
|
|
<path id="tools.test.classpath">
|
|
<path refid="tools.classpath"/>
|
|
<path refid="test.base.classpath"/>
|
|
<pathelement location="${build.dir}/classes/tools-test"/>
|
|
</path>
|
|
|
|
<target name="build-dict" depends="compile-tools, download-dict">
|
|
<sequential>
|
|
<delete verbose="true">
|
|
<fileset dir="src/resources/org/apache/lucene/analysis/ja/dict" includes="**/*"/>
|
|
</delete>
|
|
<!-- TODO: optimize the dictionary construction a bit so that you don't need 1G -->
|
|
<java fork="true" failonerror="true" maxmemory="1g" classname="org.apache.lucene.analysis.ja.util.DictionaryBuilder">
|
|
<classpath>
|
|
<path refid="tools.classpath"/>
|
|
<pathelement path="${build.dir}/classes/tools"/>
|
|
</classpath>
|
|
<assertions>
|
|
<enable package="org.apache.lucene"/>
|
|
</assertions>
|
|
<arg value="${dict.format}"/>
|
|
<arg value="${dict.src.dir}"/>
|
|
<arg value="${dict.target.dir}"/>
|
|
<arg value="${dict.encoding}"/>
|
|
<arg value="${dict.normalize}"/>
|
|
</java>
|
|
</sequential>
|
|
</target>
|
|
|
|
<!-- we don't actually need to compile this thing, we just want its lib -->
|
|
<target name="resolve-icu">
|
|
<ant dir="../icu/" target="resolve" inheritAll="false">
|
|
<propertyset refid="uptodate.and.compiled.properties"/>
|
|
</ant>
|
|
</target>
|
|
|
|
<target name="compile-tools" depends="resolve-icu, compile-core, common.compile-tools">
|
|
<compile
|
|
srcdir="src/tools/java"
|
|
destdir="${build.dir}/classes/tools">
|
|
<classpath>
|
|
<path refid="tools.classpath"/>
|
|
<pathelement path="src/tools/java"/>
|
|
</classpath>
|
|
</compile>
|
|
</target>
|
|
|
|
<target name="compile-tools-tests" depends="compile-tools">
|
|
<compile
|
|
srcdir="src/tools/test"
|
|
destdir="${build.dir}/classes/tools-test">
|
|
<classpath>
|
|
<path refid="tools.test.classpath"/>
|
|
<pathelement path="src/tools/test"/>
|
|
</classpath>
|
|
</compile>
|
|
</target>
|
|
|
|
<target name="test-tools" depends="compile-tools-tests">
|
|
<test-macro dataDir="src/tools/test" junit.classpath="tools.test.classpath"/>
|
|
</target>
|
|
|
|
<target name="compile-test" depends="module-build.compile-test, compile-tools-tests"/>
|
|
<!-- TODO: not until we properly make 'test-tools' work with clover etc
|
|
<target name="test" depends="module-build.test, test-tools"/> -->
|
|
|
|
</project>
|