Add ignoreAttachements option for couchDb river

This commit is contained in:
David Pilato 2011-08-27 16:40:00 +02:00 committed by Shay Banon
parent ba352e0dc6
commit 1f30681a84
3 changed files with 100 additions and 2 deletions

1
plugins/river/couchdb/.gitignore vendored Normal file
View File

@ -0,0 +1 @@
/data

View File

@ -62,6 +62,7 @@ import static org.elasticsearch.common.xcontent.XContentFactory.*;
/**
* @author kimchy (shay.banon)
* @author dadoonet (David Pilato) for attachments filter
*/
public class CouchdbRiver extends AbstractRiverComponent implements River {
@ -75,6 +76,7 @@ public class CouchdbRiver extends AbstractRiverComponent implements River {
private final String couchFilter;
private final String couchFilterParamsUrl;
private final String basicAuth;
private final boolean couchIgnoreAttachements;
private final String indexName;
private final String typeName;
@ -116,6 +118,7 @@ public class CouchdbRiver extends AbstractRiverComponent implements River {
} else {
couchFilterParamsUrl = null;
}
couchIgnoreAttachements = XContentMapValues.nodeBooleanValue(couchSettings.get("ignore_attachments"), false);
if (couchSettings.containsKey("user") && couchSettings.containsKey("password")) {
String user = couchSettings.get("user").toString();
String password = couchSettings.get("password").toString();
@ -135,6 +138,7 @@ public class CouchdbRiver extends AbstractRiverComponent implements River {
couchDb = "db";
couchFilter = null;
couchFilterParamsUrl = null;
couchIgnoreAttachements = false;
basicAuth = null;
script = null;
}
@ -214,7 +218,9 @@ public class CouchdbRiver extends AbstractRiverComponent implements River {
// Ignore design documents
if (id.startsWith("_design/")) {
logger.trace("ignoring design document {}", id);
if (logger.isTraceEnabled()) {
logger.trace("ignoring design document {}", id);
}
return seq;
}
@ -246,7 +252,23 @@ public class CouchdbRiver extends AbstractRiverComponent implements River {
if (logger.isTraceEnabled()) {
logger.trace("processing [index ]: [{}]/[{}]/[{}], source {}", index, type, id, doc);
}
bulk.add(indexRequest(index).type(type).id(id).source(doc).routing(extractRouting(ctx)));
// Remove _attachement from doc if needed
// TODO : check if couchDB support now attachment filter : https://issues.apache.org/jira/browse/COUCHDB-1263
if (couchIgnoreAttachements) {
if (doc.containsKey("_attachments")) {
Map<String, Object> _attachments = (Map<String, Object>) doc
.get("_attachments");
if (_attachments != null) {
doc.remove("_attachments");
if (logger.isTraceEnabled()) {
logger.trace("_attachments found and removed from doc");
}
}
}
}
bulk.add(indexRequest(index).type(type).id(id).source(doc).routing(extractRouting(ctx)));
} else {
logger.warn("ignoring unknown change {}", s);
}
@ -381,6 +403,8 @@ public class CouchdbRiver extends AbstractRiverComponent implements River {
file = file + couchFilterParamsUrl;
}
}
// TODO : check if couchDB support now attachment filter : https://issues.apache.org/jira/browse/COUCHDB-1263
if (lastSeq != null) {
file = file + "&since=" + lastSeq;
}

View File

@ -0,0 +1,73 @@
/*
* Licensed to Elastic Search and Shay Banon under one
* or more contributor license agreements. See the NOTICE file
* distributed with this work for additional information
* regarding copyright ownership. Elastic Search licenses this
* file to you under the Apache License, Version 2.0 (the
* "License"); you may not use this file except in compliance
* with the License. You may obtain a copy of the License at
*
* http://www.apache.org/licenses/LICENSE-2.0
*
* Unless required by applicable law or agreed to in writing,
* software distributed under the License is distributed on an
* "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
* KIND, either express or implied. See the License for the
* specific language governing permissions and limitations
* under the License.
*/
package org.elasticsearch.river.couchdb;
import static org.elasticsearch.common.xcontent.XContentFactory.jsonBuilder;
import org.elasticsearch.action.admin.indices.delete.DeleteIndexRequest;
import org.elasticsearch.common.settings.ImmutableSettings;
import org.elasticsearch.common.xcontent.XContentBuilder;
import org.elasticsearch.indices.IndexMissingException;
import org.elasticsearch.node.Node;
import org.elasticsearch.node.NodeBuilder;
/**
* This is a simple test case for testing attachements removing.<br>
* You may have a couchdb instance running on localhost:5984 with a mytest database.<br>
* If you push documents with attachements in it, attachements should be ignored by the river.
* @author dadoonet (David Pilato)
*/
public class CouchdbRiverAttachementTest {
public static void main(String[] args) throws Exception {
String host = "localhost";
String port = "5984";
String db = "mytest";
boolean ignoreAttachements = true;
Node node = NodeBuilder.nodeBuilder().settings(ImmutableSettings.settingsBuilder().put("gateway.type", "local")).node();
Thread.sleep(1000);
try {
node.client().admin().indices().delete(new DeleteIndexRequest("_river")).actionGet();
} catch (IndexMissingException e) {
// Index does not exist... Fine
}
Thread.sleep(1000);
try {
node.client().admin().indices().delete(new DeleteIndexRequest(db)).actionGet();
} catch (IndexMissingException e) {
// Index does not exist... Fine
}
XContentBuilder xb = jsonBuilder()
.startObject()
.field("type", "couchdb")
.startObject("couchdb")
.field("host", host)
.field("port", port)
.field("db", db)
.field("ignoreAttachements", ignoreAttachements)
.endObject()
.endObject();
node.client().prepareIndex("_river", db, "_meta").setSource(xb).execute().actionGet();
Thread.sleep(100000);
}
}