SOLR-11794: Restart replicate from ledaer on core reload on PULL replicas

This commit is contained in:
Tomas Fernandez Lobbe 2018-01-15 16:15:14 -08:00
parent a08f71279c
commit 1c4b417c50
3 changed files with 51 additions and 32 deletions

View File

@ -104,6 +104,8 @@ Bug Fixes
* SOLR-11839: Fix test failures resulting from SOLR-11218 (Erick Erickson) * SOLR-11839: Fix test failures resulting from SOLR-11218 (Erick Erickson)
* SOLR-11794: PULL replicas stop replicating after collection RELOAD (Samuel Tatipamula, Tomás Fernández Löbbe)
Optimizations Optimizations
---------------------- ----------------------

View File

@ -1300,6 +1300,9 @@ public class CoreContainer {
getZkController().startReplicationFromLeader(newCore.getName(), true); getZkController().startReplicationFromLeader(newCore.getName(), true);
} }
} else if(replica.getType() == Replica.Type.PULL) {
getZkController().stopReplicationFromLeader(core.getName());
getZkController().startReplicationFromLeader(newCore.getName(), false);
} }
} }
} catch (SolrCoreState.CoreIsClosedException e) { } catch (SolrCoreState.CoreIsClosedException e) {

View File

@ -214,45 +214,59 @@ public class TestPullReplica extends SolrCloudTestCase {
@SuppressWarnings("unchecked") @SuppressWarnings("unchecked")
public void testAddDocs() throws Exception { public void testAddDocs() throws Exception {
int numReadOnlyReplicas = 1 + random().nextInt(3); int numPullReplicas = 1 + random().nextInt(3);
CollectionAdminRequest.createCollection(collectionName, "conf", 1, 1, 0, numReadOnlyReplicas) CollectionAdminRequest.createCollection(collectionName, "conf", 1, 1, 0, numPullReplicas)
.setMaxShardsPerNode(100) .setMaxShardsPerNode(100)
.process(cluster.getSolrClient()); .process(cluster.getSolrClient());
waitForState("Expected collection to be created with 1 shard and " + (numReadOnlyReplicas + 1) + " replicas", collectionName, clusterShape(1, numReadOnlyReplicas + 1)); waitForState("Expected collection to be created with 1 shard and " + (numPullReplicas + 1) + " replicas", collectionName, clusterShape(1, numPullReplicas + 1));
DocCollection docCollection = assertNumberOfReplicas(1, 0, numReadOnlyReplicas, false, true); DocCollection docCollection = assertNumberOfReplicas(1, 0, numPullReplicas, false, true);
assertEquals(1, docCollection.getSlices().size()); assertEquals(1, docCollection.getSlices().size());
cluster.getSolrClient().add(collectionName, new SolrInputDocument("id", "1", "foo", "bar")); boolean reloaded = false;
cluster.getSolrClient().commit(collectionName); int numDocs = 0;
while (true) {
numDocs++;
cluster.getSolrClient().add(collectionName, new SolrInputDocument("id", String.valueOf(numDocs), "foo", "bar"));
cluster.getSolrClient().commit(collectionName);
Slice s = docCollection.getSlices().iterator().next(); Slice s = docCollection.getSlices().iterator().next();
try (HttpSolrClient leaderClient = getHttpSolrClient(s.getLeader().getCoreUrl())) { try (HttpSolrClient leaderClient = getHttpSolrClient(s.getLeader().getCoreUrl())) {
assertEquals(1, leaderClient.query(new SolrQuery("*:*")).getResults().getNumFound()); assertEquals(numDocs, leaderClient.query(new SolrQuery("*:*")).getResults().getNumFound());
} }
TimeOut t = new TimeOut(REPLICATION_TIMEOUT_SECS, TimeUnit.SECONDS, TimeSource.NANO_TIME); TimeOut t = new TimeOut(REPLICATION_TIMEOUT_SECS, TimeUnit.SECONDS, TimeSource.NANO_TIME);
for (Replica r:s.getReplicas(EnumSet.of(Replica.Type.PULL))) { for (Replica r:s.getReplicas(EnumSet.of(Replica.Type.PULL))) {
//TODO: assert replication < REPLICATION_TIMEOUT_SECS //TODO: assert replication < REPLICATION_TIMEOUT_SECS
try (HttpSolrClient readOnlyReplicaClient = getHttpSolrClient(r.getCoreUrl())) { try (HttpSolrClient pullReplicaClient = getHttpSolrClient(r.getCoreUrl())) {
while (true) { while (true) {
try { try {
assertEquals("Replica " + r.getName() + " not up to date after 10 seconds", assertEquals("Replica " + r.getName() + " not up to date after 10 seconds",
1, readOnlyReplicaClient.query(new SolrQuery("*:*")).getResults().getNumFound()); numDocs, pullReplicaClient.query(new SolrQuery("*:*")).getResults().getNumFound());
break; break;
} catch (AssertionError e) { } catch (AssertionError e) {
if (t.hasTimedOut()) { if (t.hasTimedOut()) {
throw e; throw e;
} else { } else {
Thread.sleep(100); Thread.sleep(100);
}
} }
} }
SolrQuery req = new SolrQuery(
"qt", "/admin/plugins",
"stats", "true");
QueryResponse statsResponse = pullReplicaClient.query(req);
assertEquals("Replicas shouldn't process the add document request: " + statsResponse,
0L, ((Map<String, Object>)((NamedList<Object>)statsResponse.getResponse()).findRecursive("plugins", "UPDATE", "updateHandler", "stats")).get("UPDATE.updateHandler.adds"));
} }
SolrQuery req = new SolrQuery( }
"qt", "/admin/plugins", if (reloaded) {
"stats", "true"); break;
QueryResponse statsResponse = readOnlyReplicaClient.query(req); } else {
assertEquals("Replicas shouldn't process the add document request: " + statsResponse, // reload
0L, ((Map<String, Object>)((NamedList<Object>)statsResponse.getResponse()).findRecursive("plugins", "UPDATE", "updateHandler", "stats")).get("UPDATE.updateHandler.adds")); CollectionAdminResponse response = CollectionAdminRequest.reloadCollection(collectionName)
.process(cluster.getSolrClient());
assertEquals(0, response.getStatus());
reloaded = true;
} }
} }
assertUlogPresence(docCollection); assertUlogPresence(docCollection);