Mappings: simplify dynamic mappings updates.

While dynamic mappings updates have been using the same code path as updates from the API when applied on a data node since #10593, they were still using a different code path on the master node. This commit makes dynamic updates be processed the same way as updates from the API, which also seems to do a better job at acknowledgements (I could not reproduce the ConcurrentDynamicTemplateTests failure anymore). It also adds more checks, for instance that indexing on replicas should not trigger dynamic mapping updates, since they should have been handled on the primary before. Close #10720
elastic · Apr 23, 2015 · c6cdf77 · c6cdf77
1 parent dbeb4aa
commit c6cdf77
Show file tree

Hide file tree

Showing 11 changed files with 201 additions and 423 deletions.
diff --git a/src/main/java/org/elasticsearch/action/bulk/TransportShardBulkAction.java b/src/main/java/org/elasticsearch/action/bulk/TransportShardBulkAction.java
@@ -52,6 +52,7 @@
 import org.elasticsearch.index.engine.DocumentAlreadyExistsException;
 import org.elasticsearch.index.engine.Engine;
 import org.elasticsearch.index.engine.VersionConflictEngineException;
+import org.elasticsearch.index.mapper.MapperService;
 import org.elasticsearch.index.mapper.Mapping;
 import org.elasticsearch.index.mapper.SourceToParse;
 import org.elasticsearch.index.shard.IndexShard;
@@ -352,23 +353,6 @@ <T extends ActionWriteResponse> T response() {
 
     }
 
-    private void applyMappingUpdate(IndexService indexService, String type, Mapping update) throws Throwable {
-        // HACK: Rivers seem to have something specific that triggers potential
-        // deadlocks when doing concurrent indexing. So for now they keep the
-        // old behaviour of updating mappings locally first and then
-        // asynchronously notifying the master
-        // this can go away when rivers are removed
-        final String indexName = indexService.index().name();
-        final String indexUUID = indexService.indexUUID();
-        if (indexName.equals(RiverIndexName.Conf.indexName(settings))) {
-            indexService.mapperService().merge(type, new CompressedString(update.toBytes()), true);
-            mappingUpdatedAction.updateMappingOnMaster(indexName, indexUUID, type, update, null);
-        } else {
-            mappingUpdatedAction.updateMappingOnMasterSynchronously(indexName, indexUUID, type, update);
-            indexService.mapperService().merge(type, new CompressedString(update.toBytes()), true);
-        }
-    }
-
     private WriteResult shardIndexOperation(BulkShardRequest request, IndexRequest indexRequest, ClusterState clusterState,
                                             IndexShard indexShard, IndexService indexService, boolean processed) throws Throwable {
 
@@ -392,20 +376,54 @@ private WriteResult shardIndexOperation(BulkShardRequest request, IndexRequest i
         Engine.IndexingOperation op;
         if (indexRequest.opType() == IndexRequest.OpType.INDEX) {
             Engine.Index index = indexShard.prepareIndex(sourceToParse, indexRequest.version(), indexRequest.versionType(), Engine.Operation.Origin.PRIMARY, request.canHaveDuplicates() || indexRequest.canHaveDuplicates());
-            if (index.parsedDoc().dynamicMappingsUpdate() != null) {
-                applyMappingUpdate(indexService, indexRequest.type(), index.parsedDoc().dynamicMappingsUpdate());
+            Mapping update = index.parsedDoc().dynamicMappingsUpdate();
+            if (update != null) {
+                final String indexName = indexService.index().name();
+                if (indexName.equals(RiverIndexName.Conf.indexName(settings))) {
+                    // With rivers, we have a chicken and egg problem if indexing
+                    // the _meta document triggers a mapping update. Because we would
+                    // like to validate the mapping update first, but on the other
+                    // hand putting the mapping would start the river, which expects
+                    // to find a _meta document
+                    // So we have no choice but to index first and send mappings afterwards
+                    MapperService mapperService = indexService.mapperService();
+                    mapperService.merge(indexRequest.type(), new CompressedString(update.toBytes()), true);
+                    indexShard.index(index);
+                    mappingUpdatedAction.updateMappingOnMasterAsynchronously(indexName, indexRequest.type(), update);
+                } else {
+                    mappingUpdatedAction.updateMappingOnMasterSynchronously(indexName, indexRequest.type(), update);
+                    indexShard.index(index);
+                }
+            } else {
+                indexShard.index(index);
             }
-            indexShard.index(index);
             version = index.version();
             op = index;
             created = index.created();
         } else {
             Engine.Create create = indexShard.prepareCreate(sourceToParse, indexRequest.version(), indexRequest.versionType(), Engine.Operation.Origin.PRIMARY,
                     request.canHaveDuplicates() || indexRequest.canHaveDuplicates(), indexRequest.autoGeneratedId());
-            if (create.parsedDoc().dynamicMappingsUpdate() != null) {
-                applyMappingUpdate(indexService, indexRequest.type(), create.parsedDoc().dynamicMappingsUpdate());
+            Mapping update = create.parsedDoc().dynamicMappingsUpdate();
+            if (update != null) {
+                final String indexName = indexService.index().name();
+                if (indexName.equals(RiverIndexName.Conf.indexName(settings))) {
+                    // With rivers, we have a chicken and egg problem if indexing
+                    // the _meta document triggers a mapping update. Because we would
+                    // like to validate the mapping update first, but on the other
+                    // hand putting the mapping would start the river, which expects
+                    // to find a _meta document
+                    // So we have no choice but to index first and send mappings afterwards
+                    MapperService mapperService = indexService.mapperService();
+                    mapperService.merge(indexRequest.type(), new CompressedString(update.toBytes()), true);
+                    indexShard.create(create);
+                    mappingUpdatedAction.updateMappingOnMasterAsynchronously(indexName, indexRequest.type(), update);
+                } else {
+                    mappingUpdatedAction.updateMappingOnMasterSynchronously(indexName, indexRequest.type(), update);
+                    indexShard.create(create);
+                }
+            } else {
+                indexShard.create(create);
             }
-            indexShard.create(create);
             version = create.version();
             op = create;
             created = true;
@@ -528,8 +546,9 @@ private UpdateResult shardUpdateOperation(ClusterState clusterState, BulkShardRe
 
 
     @Override
-    protected void shardOperationOnReplica(ReplicaOperationRequest shardRequest) {
-        IndexShard indexShard = indicesService.indexServiceSafe(shardRequest.shardId.getIndex()).shardSafe(shardRequest.shardId.id());
+    protected void shardOperationOnReplica(ReplicaOperationRequest shardRequest) throws Exception {
+        IndexService indexService = indicesService.indexServiceSafe(shardRequest.shardId.getIndex());
+        IndexShard indexShard = indexService.shardSafe(shardRequest.shardId.id());
         final BulkShardRequest request = shardRequest.request;
         for (int i = 0; i < request.items().length; i++) {
             BulkItemRequest item = request.items()[i];
@@ -544,11 +563,29 @@ protected void shardOperationOnReplica(ReplicaOperationRequest shardRequest) {
 
                     if (indexRequest.opType() == IndexRequest.OpType.INDEX) {
                         Engine.Index index = indexShard.prepareIndex(sourceToParse, indexRequest.version(), indexRequest.versionType(), Engine.Operation.Origin.REPLICA, request.canHaveDuplicates() || indexRequest.canHaveDuplicates());
+                        if (index.parsedDoc().dynamicMappingsUpdate() != null) {
+                            if (indexService.index().name().equals(RiverIndexName.Conf.indexName(settings))) {
+                                // mappings updates on the _river are not validated synchronously so we can't
+                                // assume they are here when indexing on a replica
+                                indexService.mapperService().merge(indexRequest.type(), new CompressedString(index.parsedDoc().dynamicMappingsUpdate().toBytes()), true);
+                            } else {
+                                throw new ElasticsearchIllegalStateException("Index operations on replicas should not trigger dynamic mappings updates: [" + index.parsedDoc().dynamicMappingsUpdate() + "]");
+                            }
+                        }
                         indexShard.index(index);
                     } else {
                         Engine.Create create = indexShard.prepareCreate(sourceToParse,
                                 indexRequest.version(), indexRequest.versionType(),
                                 Engine.Operation.Origin.REPLICA, request.canHaveDuplicates() || indexRequest.canHaveDuplicates(), indexRequest.autoGeneratedId());
+                        if (create.parsedDoc().dynamicMappingsUpdate() != null) {
+                            if (indexService.index().name().equals(RiverIndexName.Conf.indexName(settings))) {
+                                // mappings updates on the _river are not validated synchronously so we can't
+                                // assume they are here when indexing on a replica
+                                indexService.mapperService().merge(indexRequest.type(), new CompressedString(create.parsedDoc().dynamicMappingsUpdate().toBytes()), true);
+                            } else {
+                                throw new ElasticsearchIllegalStateException("Index operations on replicas should not trigger dynamic mappings updates: [" + create.parsedDoc().dynamicMappingsUpdate() + "]");
+                            }
+                        }
                         indexShard.create(create);
                     }
                 } catch (Throwable e) {

diff --git a/src/main/java/org/elasticsearch/action/index/TransportIndexAction.java b/src/main/java/org/elasticsearch/action/index/TransportIndexAction.java
@@ -19,6 +19,7 @@
 
 package org.elasticsearch.action.index;
 
+import org.elasticsearch.ElasticsearchIllegalStateException;
 import org.elasticsearch.ExceptionsHelper;
 import org.elasticsearch.action.ActionListener;
 import org.elasticsearch.action.RoutingMissingException;
@@ -42,6 +43,7 @@
 import org.elasticsearch.common.settings.Settings;
 import org.elasticsearch.index.IndexService;
 import org.elasticsearch.index.engine.Engine;
+import org.elasticsearch.index.mapper.MapperService;
 import org.elasticsearch.index.mapper.Mapping;
 import org.elasticsearch.index.mapper.SourceToParse;
 import org.elasticsearch.index.shard.IndexShard;
@@ -51,6 +53,8 @@
 import org.elasticsearch.threadpool.ThreadPool;
 import org.elasticsearch.transport.TransportService;
 
+import java.io.IOException;
+
 /**
  * Performs the index operation.
  * <p/>
@@ -167,23 +171,6 @@ protected ShardIterator shards(ClusterState clusterState, InternalRequest reques
                 .indexShards(clusterService.state(), request.concreteIndex(), request.request().type(), request.request().id(), request.request().routing());
     }
 
-    private void applyMappingUpdate(IndexService indexService, String type, Mapping update) throws Throwable {
-        // HACK: Rivers seem to have something specific that triggers potential
-        // deadlocks when doing concurrent indexing. So for now they keep the
-        // old behaviour of updating mappings locally first and then
-        // asynchronously notifying the master
-        // this can go away when rivers are removed
-        final String indexName = indexService.index().name();
-        final String indexUUID = indexService.indexUUID();
-        if (indexName.equals(RiverIndexName.Conf.indexName(settings))) {
-            indexService.mapperService().merge(type, new CompressedString(update.toBytes()), true);
-            mappingUpdatedAction.updateMappingOnMaster(indexName, indexUUID, type, update, null);
-        } else {
-            mappingUpdatedAction.updateMappingOnMasterSynchronously(indexName, indexUUID, type, update);
-            indexService.mapperService().merge(type, new CompressedString(update.toBytes()), true);
-        }
-    }
-
     @Override
     protected Tuple<IndexResponse, IndexRequest> shardOperationOnPrimary(ClusterState clusterState, PrimaryOperationRequest shardRequest) throws Throwable {
         final IndexRequest request = shardRequest.request;
@@ -206,19 +193,53 @@ protected Tuple<IndexResponse, IndexRequest> shardOperationOnPrimary(ClusterStat
 
         if (request.opType() == IndexRequest.OpType.INDEX) {
             Engine.Index index = indexShard.prepareIndex(sourceToParse, request.version(), request.versionType(), Engine.Operation.Origin.PRIMARY, request.canHaveDuplicates());
-            if (index.parsedDoc().dynamicMappingsUpdate() != null) {
-                applyMappingUpdate(indexService, request.type(), index.parsedDoc().dynamicMappingsUpdate());
+            Mapping update = index.parsedDoc().dynamicMappingsUpdate();
+            if (update != null) {
+                final String indexName = indexService.index().name();
+                if (indexName.equals(RiverIndexName.Conf.indexName(settings))) {
+                    // With rivers, we have a chicken and egg problem if indexing
+                    // the _meta document triggers a mapping update. Because we would
+                    // like to validate the mapping update first, but on the other
+                    // hand putting the mapping would start the river, which expects
+                    // to find a _meta document
+                    // So we have no choice but to index first and send mappings afterwards
+                    MapperService mapperService = indexService.mapperService();
+                    mapperService.merge(request.type(), new CompressedString(update.toBytes()), true);
+                    indexShard.index(index);
+                    mappingUpdatedAction.updateMappingOnMasterAsynchronously(indexName, request.type(), update);
+                } else {
+                    mappingUpdatedAction.updateMappingOnMasterSynchronously(indexName, request.type(), update);
+                    indexShard.index(index);
+                }
+            } else {
+                indexShard.index(index);
             }
-            indexShard.index(index);
             version = index.version();
             created = index.created();
         } else {
             Engine.Create create = indexShard.prepareCreate(sourceToParse,
                     request.version(), request.versionType(), Engine.Operation.Origin.PRIMARY, request.canHaveDuplicates(), request.autoGeneratedId());
-            if (create.parsedDoc().dynamicMappingsUpdate() != null) {
-                applyMappingUpdate(indexService, request.type(), create.parsedDoc().dynamicMappingsUpdate());
+            Mapping update = create.parsedDoc().dynamicMappingsUpdate();
+            if (update != null) {
+                final String indexName = indexService.index().name();
+                if (indexName.equals(RiverIndexName.Conf.indexName(settings))) {
+                    // With rivers, we have a chicken and egg problem if indexing
+                    // the _meta document triggers a mapping update. Because we would
+                    // like to validate the mapping update first, but on the other
+                    // hand putting the mapping would start the river, which expects
+                    // to find a _meta document
+                    // So we have no choice but to index first and send mappings afterwards
+                    MapperService mapperService = indexService.mapperService();
+                    mapperService.merge(request.type(), new CompressedString(update.toBytes()), true);
+                    indexShard.create(create);
+                    mappingUpdatedAction.updateMappingOnMasterAsynchronously(indexName, request.type(), update);
+                } else {
+                    mappingUpdatedAction.updateMappingOnMasterSynchronously(indexName, request.type(), update);
+                    indexShard.create(create);
+                }
+            } else {
+                indexShard.create(create);
             }
-            indexShard.create(create);
             version = create.version();
             created = true;
         }
@@ -239,17 +260,36 @@ protected Tuple<IndexResponse, IndexRequest> shardOperationOnPrimary(ClusterStat
     }
 
     @Override
-    protected void shardOperationOnReplica(ReplicaOperationRequest shardRequest) {
-        IndexShard indexShard = indicesService.indexServiceSafe(shardRequest.shardId.getIndex()).shardSafe(shardRequest.shardId.id());
+    protected void shardOperationOnReplica(ReplicaOperationRequest shardRequest) throws IOException {
+        IndexService indexService = indicesService.indexServiceSafe(shardRequest.shardId.getIndex());
+        IndexShard indexShard = indexService.shardSafe(shardRequest.shardId.id());
         IndexRequest request = shardRequest.request;
         SourceToParse sourceToParse = SourceToParse.source(SourceToParse.Origin.REPLICA, request.source()).type(request.type()).id(request.id())
                 .routing(request.routing()).parent(request.parent()).timestamp(request.timestamp()).ttl(request.ttl());
         if (request.opType() == IndexRequest.OpType.INDEX) {
             Engine.Index index = indexShard.prepareIndex(sourceToParse, request.version(), request.versionType(), Engine.Operation.Origin.REPLICA, request.canHaveDuplicates());
+            if (index.parsedDoc().dynamicMappingsUpdate() != null) {
+                if (indexService.index().name().equals(RiverIndexName.Conf.indexName(settings))) {
+                    // mappings updates on the _river are not validated synchronously so we can't
+                    // assume they are here when indexing on a replica
+                    indexService.mapperService().merge(request.type(), new CompressedString(index.parsedDoc().dynamicMappingsUpdate().toBytes()), true);
+                } else {
+                    throw new ElasticsearchIllegalStateException("Index operations on replicas should not trigger dynamic mappings updates: [" + index.parsedDoc().dynamicMappingsUpdate() + "]");
+                }
+            }
             indexShard.index(index);
         } else {
             Engine.Create create = indexShard.prepareCreate(sourceToParse,
                     request.version(), request.versionType(), Engine.Operation.Origin.REPLICA, request.canHaveDuplicates(), request.autoGeneratedId());
+            if (create.parsedDoc().dynamicMappingsUpdate() != null) {
+                if (indexService.index().name().equals(RiverIndexName.Conf.indexName(settings))) {
+                    // mappings updates on the _river are not validated synchronously so we can't
+                    // assume they are here when indexing on a replica
+                    indexService.mapperService().merge(request.type(), new CompressedString(create.parsedDoc().dynamicMappingsUpdate().toBytes()), true);
+                } else {
+                    throw new ElasticsearchIllegalStateException("Index operations on replicas should not trigger dynamic mappings updates: [" + create.parsedDoc().dynamicMappingsUpdate() + "]");
+                }
+            }
             indexShard.create(create);
         }
         if (request.refresh()) {

diff --git a/...rg/elasticsearch/action/support/replication/TransportShardReplicationOperationAction.java b/...rg/elasticsearch/action/support/replication/TransportShardReplicationOperationAction.java
@@ -117,7 +117,7 @@ protected void doExecute(Request request, ActionListener<Response> listener) {
      */
     protected abstract Tuple<Response, ReplicaRequest> shardOperationOnPrimary(ClusterState clusterState, PrimaryOperationRequest shardRequest)  throws Throwable;
 
-    protected abstract void shardOperationOnReplica(ReplicaOperationRequest shardRequest);
+    protected abstract void shardOperationOnReplica(ReplicaOperationRequest shardRequest) throws Exception;
 
     protected abstract ShardIterator shards(ClusterState clusterState, InternalRequest request) throws ElasticsearchException;