Skip to content

Commit 3f64076

Browse files
committed
bring back the primary shard chasing to the PrimaryPhase
1 parent 2abe7c4 commit 3f64076

File tree

2 files changed

+86
-46
lines changed

2 files changed

+86
-46
lines changed

core/src/main/java/org/elasticsearch/action/support/replication/TransportReplicationAction.java

+79-37
Original file line numberDiff line numberDiff line change
@@ -293,6 +293,8 @@ public void onFailure(Throwable t) {
293293
@Override
294294
protected void doRun() throws Exception {
295295
final ShardRouting primary = request.internalShardRouting;
296+
// Although this gets executed locally, this is more of an assertion, but if we change the primary action
297+
// to be performed remotely, this check is important to perform before executing the action:
296298
if (clusterService.localNode().id().equals(primary.currentNodeId()) == false) {
297299
throw new NoShardAvailableActionException(primary.shardId(), "shard [{}] not assigned to this node [{}], but node [{}]", primary.shardId(), clusterService.localNode().id(), primary.currentNodeId());
298300
}
@@ -563,7 +565,7 @@ protected void doRun() {
563565
retryBecauseUnavailable(shardIt.shardId(), "Primary shard is not active or isn't assigned to a known node.");
564566
return;
565567
}
566-
moveToPrimaryAction(primary);
568+
routeRequestOrPerformPrimaryActionLocally(primary);
567569
}
568570

569571
/**
@@ -618,52 +620,92 @@ protected ShardRouting resolvePrimary(ShardIterator shardIt) {
618620
/**
619621
* send the request to the node holding the primary or execute if local
620622
*/
621-
protected void moveToPrimaryAction(final ShardRouting primary) {
623+
protected void routeRequestOrPerformPrimaryActionLocally(final ShardRouting primary) {
622624
DiscoveryNode node = observer.observedState().nodes().get(primary.currentNodeId());
623-
Request request = internalRequest.request();
624-
request.internalShardRouting = primary;
625-
transportService.sendRequest(node, transportPrimaryAction, request, transportOptions, new BaseTransportResponseHandler<Response>() {
625+
if (primary.currentNodeId().equals(observer.observedState().nodes().localNodeId())) {
626+
Request request = internalRequest.request();
627+
request.internalShardRouting = primary;
628+
// this call is always local, but in the future we can send to remote nodes as well
629+
transportService.sendRequest(node, transportPrimaryAction, request, transportOptions, new BaseTransportResponseHandler<Response>() {
626630

627-
@Override
628-
public Response newInstance() {
629-
return newResponseInstance();
630-
}
631+
@Override
632+
public Response newInstance() {
633+
return newResponseInstance();
634+
}
631635

632-
@Override
633-
public String executor() {
634-
return ThreadPool.Names.SAME;
635-
}
636+
@Override
637+
public String executor() {
638+
return ThreadPool.Names.SAME;
639+
}
636640

637-
@Override
638-
public void handleResponse(Response response) {
639-
finishOnRemoteSuccess(response);
640-
}
641+
@Override
642+
public void handleResponse(Response response) {
643+
finishOnRemoteSuccess(response);
644+
}
641645

642-
@Override
643-
public void handleException(TransportException exp) {
644-
try {
645-
Throwable cause = exp.getCause();
646-
// if we got disconnected from the node, or the node / shard is not in the right state (being closed)
647-
if (cause instanceof ConnectTransportException || cause instanceof NodeClosedException ||
648-
cause instanceof UnavailableShardsException || retryPrimaryException(cause)) {
649-
internalRequest.request().setCanHaveDuplicates();
650-
// we already marked it as started when we executed it (removed the listener) so pass false
651-
// to re-add to the cluster listener
652-
logger.trace("received an error from node the primary was assigned to ({}), scheduling a retry", exp.getMessage());
653-
if (cause instanceof UnavailableShardsException) {
654-
UnavailableShardsException use = (UnavailableShardsException) cause;
655-
retryBecauseUnavailable(use.getShardId(), use.getMessage());
646+
@Override
647+
public void handleException(TransportException exp) {
648+
try {
649+
Throwable cause = exp.getCause();
650+
// if we got disconnected from the node, or the node / shard is not in the right state (being closed)
651+
if (cause instanceof ConnectTransportException || cause instanceof NodeClosedException ||
652+
cause instanceof UnavailableShardsException || retryPrimaryException(cause)) {
653+
internalRequest.request().setCanHaveDuplicates();
654+
// we already marked it as started when we executed it (removed the listener) so pass false
655+
// to re-add to the cluster listener
656+
logger.trace("received an error from node the primary was assigned to ({}), scheduling a retry", exp.getMessage());
657+
if (cause instanceof UnavailableShardsException) {
658+
UnavailableShardsException use = (UnavailableShardsException) cause;
659+
retryBecauseUnavailable(use.getShardId(), use.getMessage());
660+
} else {
661+
retry(exp);
662+
}
656663
} else {
664+
finishAsFailed(exp);
665+
}
666+
} catch (Throwable t) {
667+
finishWithUnexpectedFailure(t);
668+
}
669+
}
670+
});
671+
} else {
672+
transportService.sendRequest(node, actionName, internalRequest.request(), transportOptions, new BaseTransportResponseHandler<Response>() {
673+
674+
@Override
675+
public Response newInstance() {
676+
return newResponseInstance();
677+
}
678+
679+
@Override
680+
public String executor() {
681+
return ThreadPool.Names.SAME;
682+
}
683+
684+
@Override
685+
public void handleResponse(Response response) {
686+
finishOnRemoteSuccess(response);
687+
}
688+
689+
@Override
690+
public void handleException(TransportException exp) {
691+
try {
692+
// if we got disconnected from the node, or the node / shard is not in the right state (being closed)
693+
if (exp.unwrapCause() instanceof ConnectTransportException || exp.unwrapCause() instanceof NodeClosedException ||
694+
retryPrimaryException(exp)) {
695+
internalRequest.request().setCanHaveDuplicates();
696+
// we already marked it as started when we executed it (removed the listener) so pass false
697+
// to re-add to the cluster listener
698+
logger.trace("received an error from node the primary was assigned to ({}), scheduling a retry", exp.getMessage());
657699
retry(exp);
700+
} else {
701+
finishAsFailed(exp);
658702
}
659-
} else {
660-
finishAsFailed(exp);
703+
} catch (Throwable t) {
704+
finishWithUnexpectedFailure(t);
661705
}
662-
} catch (Throwable t) {
663-
finishWithUnexpectedFailure(t);
664706
}
665-
}
666-
});
707+
});
708+
}
667709
}
668710

669711
void retry(Throwable failure) {

core/src/test/java/org/elasticsearch/action/support/replication/ShardReplicationTests.java

+7-9
Original file line numberDiff line numberDiff line change
@@ -66,6 +66,7 @@
6666

6767
import java.io.IOException;
6868
import java.util.HashSet;
69+
import java.util.List;
6970
import java.util.Set;
7071
import java.util.concurrent.CountDownLatch;
7172
import java.util.concurrent.ExecutionException;
@@ -342,24 +343,21 @@ public void testRoutingToPrimary() {
342343

343344
TransportReplicationAction<Request, Request, Response>.PrimaryPhase primaryPhase = action.new PrimaryPhase(request, listener);
344345
assertTrue(primaryPhase.checkBlocks());
346+
primaryPhase.routeRequestOrPerformPrimaryActionLocally(shardRoutingTable.primaryShard());
345347
if (primaryNodeId.equals(clusterService.localNode().id())) {
346348
logger.info("--> primary is assigned locally, testing for execution");
347-
primaryPhase.moveToPrimaryAction(shardRoutingTable.primaryShard());
348349
assertTrue("request failed to be processed on a local primary", request.processedOnPrimary.get());
349350
if (transport.capturedRequests().length > 0) {
350351
assertIndexShardCounter(2);
351352
} else {
352353
assertIndexShardCounter(1);
353354
}
354355
} else {
355-
// The coordinating node says primary shard is on the local node, but the local node doesn't have it,
356-
// We need to retry; something has changed in the time between when the coordinating node received the request
357-
// and the node holding the primary shard processing the write request.
358-
// So we fail and retry (wait on a new cluster update or the timeout to expire) again from the coordinating node.
359-
logger.info("--> primary is assigned to [{}], checking request is going to be retried at some point", primaryNodeId);
360-
assertThat(clusterService.getListeners().size(), equalTo(0));
361-
primaryPhase.moveToPrimaryAction(shardRoutingTable.primaryShard());
362-
assertThat(clusterService.getListeners().size(), equalTo(1));
356+
logger.info("--> primary is assigned to [{}], checking request forwarded", primaryNodeId);
357+
final List<CapturingTransport.CapturedRequest> capturedRequests = transport.capturedRequestsByTargetNode().get(primaryNodeId);
358+
assertThat(capturedRequests, notNullValue());
359+
assertThat(capturedRequests.size(), equalTo(1));
360+
assertThat(capturedRequests.get(0).action, equalTo("testAction"));
363361
assertIndexShardUninitialized();
364362
}
365363
}

0 commit comments

Comments
 (0)