opendistro-for-elasticsearch · ktkrg · Aug 31, 2020 · Aug 3, 2020 · Aug 3, 2020 · Aug 6, 2020
diff --git a/.../amazon/opendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/Collator.java b/.../amazon/opendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/Collator.java
diff --git a/...amazon/opendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/Publisher.java b/...amazon/opendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/Publisher.java
@@ -20,19 +20,18 @@
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.ActionListener;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.FlipFlopDetector;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.TimedFlipFlopDetector;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.collator.Collator;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.framework.core.NonLeafNode;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.framework.metrics.ExceptionsAndErrors;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.framework.metrics.RcaGraphMetrics;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.scheduler.FlowUnitOperationArgWrapper;
 import com.google.common.annotations.VisibleForTesting;
-
 import java.time.Instant;
 import java.util.ArrayList;
 import java.util.HashMap;
 import java.util.List;
 import java.util.Map;
 import java.util.concurrent.TimeUnit;
-
 import org.apache.logging.log4j.LogManager;
 import org.apache.logging.log4j.Logger;
 

diff --git a/...stro/elasticsearch/performanceanalyzer/decisionmaker/deciders/collator/ActionGrouper.java b/...stro/elasticsearch/performanceanalyzer/decisionmaker/deciders/collator/ActionGrouper.java
@@ -0,0 +1,37 @@
+/*
+ * Copyright 2020 Amazon.com, Inc. or its affiliates. All Rights Reserved.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License").
+ * You may not use this file except in compliance with the License.
+ * A copy of the License is located at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * or in the "license" file accompanying this file. This file is distributed
+ * on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
+ * express or implied. See the License for the specific language governing
+ *  permissions and limitations under the License.
+ */
+
+package com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.collator;
+
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.Action;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.store.rca.cluster.NodeKey;
+import java.util.List;
+import java.util.Map;
+import org.checkerframework.checker.nullness.qual.NonNull;
+
+/**
+ * An interface for grouping actions. It allows the {@link Collator} to be constructed with
+ * different grouping implementations.
+ */
+public interface ActionGrouper {
+
+  /**
+   * Groups the given list of actions by the nodes they impact.
+   *
+   * @param actions The list of actions that need to be grouped; annotated as non-null.
+   * @return A map from node to the actions grouped under it; annotated as non-null.
+   */
+  @NonNull Map<NodeKey, List<Action>> groupByInstanceId(@NonNull final List<Action> actions);
+}
diff --git a/...pendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/collator/Collator.java b/...pendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/collator/Collator.java
@@ -0,0 +1,148 @@
+/*
+ * Copyright 2020 Amazon.com, Inc. or its affiliates. All Rights Reserved.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License").
+ * You may not use this file except in compliance with the License.
+ * A copy of the License is located at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * or in the "license" file accompanying this file. This file is distributed
+ * on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
+ * express or implied. See the License for the specific language governing
+ *  permissions and limitations under the License.
+ */
+
+package com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.collator;
+
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.Action;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.ImpactVector;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.ImpactVector.Impact;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.Decider;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.Decision;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.framework.api.AnalysisGraph;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.store.rca.cluster.NodeKey;
+import java.util.ArrayList;
+import java.util.Arrays;
+import java.util.List;
+import java.util.Map;
+import org.checkerframework.checker.nullness.qual.NonNull;
+
+/**
+ * Collator collects and prunes the candidate decisions from each decider so that their impacts are
+ * aligned.
+ *
+ * <p>Decisions can increase or decrease pressure on different key resources on an Elasticsearch
+ * node. This is encapsulated in each Action via the {@link ImpactVector}. Since each decider
+ * independently evaluates its decision, it is possible to have conflicting ImpactVectors from
+ * actions across deciders.
+ *
+ * <p>The collator prunes them to ensure we only take actions that either increase, or decrease
+ * pressure on a particular node. To resolve conflicts, we prefer stability over performance. In
+ * order for the above guarantee to work, there should be only one collator instance in an {@link
+ * AnalysisGraph}.
+ */
+public class Collator extends Decider {
+
+  public static final String NAME = "collator";
+
+  /* Deciders can choose to publish decisions at different frequencies based on the
+   * type of resources monitored and rca signals. The collator should however, not introduce any
+   * unnecessary delays. As soon as a decision is taken, it should be evaluated and published downstream.
+   */
+  private static final int collatorFrequency = 1; // Measured in terms of number of evaluationIntervalPeriods
+
+  private static final int evalIntervalSeconds = 5;
+
+  private final List<Decider> deciders;
+
+  private final ActionGrouper actionGrouper;
+
+  public Collator(Decider... deciders) {
+    this(new SingleNodeImpactActionGrouper(), deciders);
+  }
+
+  public Collator(ActionGrouper actionGrouper, Decider... deciders) {
+    super(evalIntervalSeconds, collatorFrequency);
+    this.deciders = Arrays.asList(deciders);
+    this.actionGrouper = actionGrouper;
+  }
+
+  @Override
+  public String name() {
+    return NAME;
+  }
+
+  /**
+   * The collator uses an action grouping strategy to first group actions by instanceIds. Then, the
+   * collator polarizes the list of actions per instance to be in the same direction of pressure,
+   * i.e. the polarized actions for a node either all increase pressure on it in some dimension,
+   * or none of them increases pressure on it.
+   *
+   * <p>When there are conflicting actions suggested by the deciders for an instance, the
+   * polarization logic prunes the actions that increase pressure on that instance and retains
+   * only the actions that do not increase pressure in any dimension.</p>
+   *
+   * @return A {@link Decision} instance that contains the list of polarized actions.
+   */
+  @Override
+  public Decision operate() {
+    final List<Action> proposedActions = getAllProposedActions();
+    final Map<NodeKey, List<Action>> actionsByNode = actionGrouper
+        .groupByInstanceId(proposedActions);
+    final List<Action> prunedActions = new ArrayList<>();
+    actionsByNode.forEach((nodeKey, actions) -> prunedActions.addAll(polarize(nodeKey, actions)));
+
+    final Decision finalDecision = new Decision(System.currentTimeMillis(), NAME);
+    finalDecision.addAllActions(prunedActions);
+    return finalDecision;
+  }
+
+  @NonNull
+  private List<Action> getAllProposedActions() {
+    final List<Action> proposedActions = new ArrayList<>();
+    if (deciders != null) {
+      for (final Decider decider : deciders) {
+        List<Decision> decisions = decider.getFlowUnits();
+        if (decisions != null) {
+          decisions.forEach(decision -> {
+            if (decision.getActions() != null) {
+              proposedActions.addAll(decision.getActions());
+            }
+          });
+        }
+      }
+    }
+    return proposedActions;
+  }
+
+  private List<Action> polarize(final NodeKey nodeKey, final List<Action> actions) {
+    final List<Action> pressureIncreasingActions = new ArrayList<>();
+    final List<Action> pressureNonIncreasingActions = new ArrayList<>();
+
+    for (final Action action : actions) {
+      ImpactVector impactVector = action.impact().getOrDefault(nodeKey, new ImpactVector());
+
+      // Classify the action as pressure increasing action if the impact for any dimension is
+      // increasing pressure; otherwise classify it as a pressure non-increasing action.
+      if (impactVector.getImpact()
+                      .values()
+                      .stream()
+                      .anyMatch(impact -> impact == Impact.INCREASES_PRESSURE)) {
+        pressureIncreasingActions.add(action);
+      } else {
+        pressureNonIncreasingActions.add(action);
+      }
+    }
+
+    // If there are any actions that do not increase pressure on the node in any dimension,
+    // prefer those over the list of actions that increase pressure.
+    if (pressureNonIncreasingActions.size() > 0) {
+      return pressureNonIncreasingActions;
+    }
+
+    // Return the list of actions that increase pressure only if every action proposed for this
+    // node increases pressure in some dimension.
+    return pressureIncreasingActions;
+  }
+}
diff --git a/...ch/performanceanalyzer/decisionmaker/deciders/collator/SingleNodeImpactActionGrouper.java b/...ch/performanceanalyzer/decisionmaker/deciders/collator/SingleNodeImpactActionGrouper.java
@@ -0,0 +1,50 @@
+/*
+ * Copyright 2020 Amazon.com, Inc. or its affiliates. All Rights Reserved.
+ *
+ * Licensed under the Apache License, Version 2.0 (the "License").
+ * You may not use this file except in compliance with the License.
+ * A copy of the License is located at
+ *
+ *      http://www.apache.org/licenses/LICENSE-2.0
+ *
+ * or in the "license" file accompanying this file. This file is distributed
+ * on an "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either
+ * express or implied. See the License for the specific language governing
+ *  permissions and limitations under the License.
+ */
+
+package com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.collator;
+
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.Action;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.store.rca.cluster.NodeKey;
+import java.util.ArrayList;
+import java.util.HashMap;
+import java.util.List;
+import java.util.Map;
+import org.checkerframework.checker.nullness.qual.NonNull;
+
+public class SingleNodeImpactActionGrouper implements ActionGrouper {
+
+  /**
+   * Groups actions by instance they impact. This grouping method considers only those actions that
+   * impact exactly one node as valid candidates for grouping and as a result it filters out
+   * actions that impact no node or multiple nodes.
+   *
+   * <p>Any action that impacts more than one node will need a more involved handling logic and
+   * this method is not to be used for grouping such actions.</p>
+   *
+   * @param actions The list of actions that need to be grouped.
+   * @return A map from each impacted node to the single-node actions that impact it.
+   */
+  @Override
+  @NonNull
+  public Map<NodeKey, List<Action>> groupByInstanceId(@NonNull List<Action> actions) {
+    final Map<NodeKey, List<Action>> actionsByNodeId = new HashMap<>();
+    actions.stream()
+           .filter(action -> action.impactedNodes().size() == 1)
+           .forEach(action -> actionsByNodeId.computeIfAbsent(action.impactedNodes()
+                                                                    .get(0), k -> new ArrayList<>())
+                                             .add(action));
+    return actionsByNodeId;
+  }
+}
diff --git a/...on/opendistro/elasticsearch/performanceanalyzer/rca/store/ElasticSearchAnalysisGraph.java b/...on/opendistro/elasticsearch/performanceanalyzer/rca/store/ElasticSearchAnalysisGraph.java
@@ -22,9 +22,9 @@
 import static com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.framework.util.RcaConsts.RcaTagConstants.TAG_LOCUS;
 
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.CacheHealthDecider;
-import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.Collator;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.Publisher;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.QueueHealthDecider;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.collator.Collator;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.metrics.AllMetrics.CommonDimension;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.metrics.AllMetrics.ShardStatsDerivedDimension;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.metricsdb.MetricsDB;
@@ -103,7 +103,6 @@
 import java.util.Arrays;
 import java.util.Collections;
 import java.util.List;
-
 import org.apache.logging.log4j.LogManager;
 import org.apache.logging.log4j.Logger;
 
@@ -274,7 +273,7 @@ public void construct() {
     //constructResourceHeatMapGraph();
 
     // Collator - Collects actions from all deciders and aligns impact vectors
-    Collator collator = new Collator(EVALUATION_INTERVAL_SECONDS, queueHealthDecider, cacheHealthDecider);
+    Collator collator = new Collator(queueHealthDecider, cacheHealthDecider);
     collator.addTag(TAG_LOCUS, LOCUS_MASTER_NODE);
     collator.addAllUpstreams(Arrays.asList(queueHealthDecider, cacheHealthDecider));
 

diff --git a/...on/opendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/PublisherTest.java b/...on/opendistro/elasticsearch/performanceanalyzer/decisionmaker/deciders/PublisherTest.java
@@ -19,20 +19,18 @@
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.ActionListener;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.ImpactVector;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.actions.ImpactVector.Dimension;
+import com.amazon.opendistro.elasticsearch.performanceanalyzer.decisionmaker.deciders.collator.Collator;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.plugins.Plugin;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.framework.util.InstanceDetails;
 import com.amazon.opendistro.elasticsearch.performanceanalyzer.rca.store.rca.cluster.NodeKey;
 import com.google.common.collect.Lists;
-
 import java.time.Instant;
 import java.util.Collections;
 import java.util.HashMap;
 import java.util.List;
 import java.util.Map;
-
 import org.junit.Before;
 import org.junit.Test;
-
 import org.mockito.Mock;
 import org.mockito.Mockito;
 import org.mockito.MockitoAnnotations;