2015-11-06 17:04:59 -05:00
|
|
|
/*
 * Licensed to Elasticsearch under one or more contributor
 * license agreements. See the NOTICE file distributed with
 * this work for additional information regarding copyright
 * ownership. Elasticsearch licenses this file to you under
 * the Apache License, Version 2.0 (the "License"); you may
 * not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *    http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing,
 * software distributed under the License is distributed on an
 * "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
 * KIND, either express or implied.  See the License for the
 * specific language governing permissions and limitations
 * under the License.
 */
|
|
|
|
|
|
|
|
// Plugin descriptor: a human-readable description and the fully-qualified
// name of the plugin class. The `esplugin` extension itself is defined
// outside this file.
esplugin {
  description 'The mapper attachments plugin adds the attachment type to Elasticsearch using Apache Tika.'
  classname 'org.elasticsearch.mapper.attachments.MapperAttachmentsPlugin'
}
|
|
|
|
|
2015-11-10 17:58:46 -05:00
|
|
|
// Adds the versions of the third-party libraries used by this plugin to the
// `versions` map, so the dependency coordinates below can share them.
// NOTE(review): `versions` is declared outside this file; the entries
// `commonslogging` and `commonscodec` referenced further down are not added
// here and are presumably already present in that map - confirm.
versions << [
  'tika': '1.11',
  'pdfbox': '1.8.10',
  'bouncycastle': '1.52',
  'poi': '3.13'
]
|
|
|
|
|
2015-11-06 17:04:59 -05:00
|
|
|
// Compile-time dependencies of the plugin. Every library is listed
// explicitly, grouped by the document format or feature it supports.
dependencies {
  // mandatory for tika
  compile "org.apache.tika:tika-core:${versions.tika}"
  compile "org.apache.tika:tika-parsers:${versions.tika}"
  compile 'commons-io:commons-io:2.4'

  // character set detection
  compile 'com.googlecode.juniversalchardet:juniversalchardet:1.0.3'

  // external parser libraries
  // HTML
  compile 'org.ccil.cowan.tagsoup:tagsoup:1.2.1'
  // Adobe PDF
  compile "org.apache.pdfbox:pdfbox:${versions.pdfbox}"
  compile "org.apache.pdfbox:fontbox:${versions.pdfbox}"
  compile "org.apache.pdfbox:jempbox:${versions.pdfbox}"
  compile "commons-logging:commons-logging:${versions.commonslogging}"
  compile "org.bouncycastle:bcmail-jdk15on:${versions.bouncycastle}"
  compile "org.bouncycastle:bcprov-jdk15on:${versions.bouncycastle}"
  compile "org.bouncycastle:bcpkix-jdk15on:${versions.bouncycastle}"
  // OpenOffice
  compile "org.apache.poi:poi-ooxml:${versions.poi}"
  compile "org.apache.poi:poi:${versions.poi}"
  compile "org.apache.poi:poi-ooxml-schemas:${versions.poi}"
  compile "commons-codec:commons-codec:${versions.commonscodec}"
  compile 'org.apache.xmlbeans:xmlbeans:2.6.0'
  compile 'stax:stax-api:1.0.1'
  // MS Office
  compile "org.apache.poi:poi-scratchpad:${versions.poi}"
  // Apple iWork
  compile 'org.apache.commons:commons-compress:1.10'
}
|
|
|
|
|
|
|
|
// Appends an -Xlint option that switches off the cast, deprecation and
// rawtypes warning categories when compiling this plugin's main sources.
compileJava.options.compilerArgs.add('-Xlint:-cast,-deprecation,-rawtypes')
|
|
|
|
|
|
|
|
// Skip .docx, .pdf and .epub files in the forbiddenPatterns task.
// NOTE(review): presumably these are binary sample documents that cannot be
// scanned as text - confirm.
forbiddenPatterns {
  exclude '**/*.docx'
  exclude '**/*.pdf'
  exclude '**/*.epub'
}
|
2015-12-16 16:38:16 -05:00
|
|
|
|
|
|
|
// classes are missing, e.g. org.openxmlformats.schemas.drawingml.x2006.chart.CTExtensionList
thirdPartyAudit.lenient = true
// Classes left out of the third-party audit, each with the reason it is excluded.
thirdPartyAudit.excludes = [
  // uses internal java api: com.sun.syndication (SyndFeedInput, SyndFeed, SyndEntry, SyndContent)
  'org.apache.tika.parser.feed.FeedParser',
]
|