OAK-10657: shrink in-DB documents after updates fail due to 16MB limit #1314

Draft
wants to merge 6 commits into trunk
@@ -82,7 +82,7 @@ public void addRemoveNodes() throws Exception {
}

@Test
@Ignore //OAK-10646
// @Ignore //OAK-10646
public void orderableAddManyChildrenWithSave() throws Exception {
int childCount = 1000;
StringBuilder prefix = new StringBuilder("");
@@ -98,7 +98,7 @@ public void orderableAddManyChildrenWithSave() throws Exception {
}

@Test
@Ignore //OAK-10646
// @Ignore //OAK-10646
public void moveOrderableWithManyChildren() throws Exception {
int childCount = 1000;
int moveCount = 1;
@@ -121,7 +121,7 @@ public void moveOrderableWithManyChildren() throws Exception {
}

@Test
@Ignore //OAK-10646
// @Ignore //OAK-10646
public void copyOrderableWithManyChildren() throws Exception {
int childCount = 1000;
int copyCount = 1;
@@ -51,6 +51,8 @@
import org.apache.jackrabbit.oak.plugins.document.util.Utils;
import org.jetbrains.annotations.NotNull;
import org.jetbrains.annotations.Nullable;
import org.slf4j.Logger;
import org.slf4j.LoggerFactory;

import com.mongodb.ReadPreference;
import com.mongodb.WriteConcern;
@@ -101,6 +103,8 @@ public class MemoryDocumentStore implements DocumentStore {

private static final long SIZE_LIMIT = SystemPropertySupplier.create("memoryds.size.limit", -1).get();

private static final Logger LOG = LoggerFactory.getLogger(MemoryDocumentStore.class);

public MemoryDocumentStore() {
this(false);
}
@@ -341,7 +345,22 @@ private <T extends Document> T internalCreateOrUpdate(Collection<T> collection,
// update the document
UpdateUtils.applyChanges(doc, update);
maintainModCount(doc);
checkSize(doc);
try {
checkSize(doc);
} catch (DocumentStoreException ex) {
// slightly hacky approach to find "our" cluster id
if (update.hasChanges()) {
final int clusterid = Utils.extractClusterId(update);
UpdateOp shrink = Utils.getShrinkOp(doc, ":childOrder", r -> r.getClusterId() == clusterid);
// try cleanup and then retry once
long before = doc.getMemory();
UpdateUtils.applyChanges(doc, shrink);
long after = doc.getMemory();
LOG.info("Doc size was exceeded for {}: {} bytes. Applied shrink ops: {}. New size: {}. Doing one retry.",
doc.getId(), before, shrink, after);
}
checkSize(doc);
}
doc.seal();
map.put(update.getId(), doc);
return oldDoc;
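
A minimal sketch (an editor's illustration, not part of the patch) of how this shrink-and-retry path could be exercised against a MemoryDocumentStore; the path, the revision values and the assumption that memoryds.size.limit was set before the class is loaded are all hypothetical:

// Sketch only: drive the size limit and trigger the shrink-and-retry above.
// Assumes -Dmemoryds.size.limit=<small value> was set before MemoryDocumentStore
// was loaded, since SIZE_LIMIT is read once via SystemPropertySupplier.
DocumentStore store = new MemoryDocumentStore();
String id = Utils.getIdFromPath("/test");                  // hypothetical path
store.create(Collection.NODES, Collections.singletonList(new UpdateOp(id, true)));
for (int i = 0; i < 10000; i++) {
    Revision r = new Revision(i, 0, 1);                    // timestamp, counter, clusterId
    UpdateOp op = new UpdateOp(id, false);
    op.setMapEntry(":childOrder", r, "child-" + i);
    op.setMapEntry("_bc", r, "true");                      // mark the revision as a branch commit
    // once the configured limit is exceeded, the store drops all but the newest
    // :childOrder entry per cluster id and retries the size check once
    store.createOrUpdate(Collection.NODES, op);
}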
@@ -474,7 +493,10 @@ public long determineServerTimeDifferenceMillis() {
return 0;
}

private void checkSize(Document doc) {
/**
* aborts the operation if a size limit is configured and exceeded
*/
private void checkSize(Document doc) throws DocumentStoreException {
if (SIZE_LIMIT >= 0) {
int size = doc.getMemory();
if (size >= SIZE_LIMIT) {
@@ -26,6 +26,7 @@
import java.time.Instant;
import java.time.format.DateTimeFormatter;
import java.util.ArrayList;
import java.util.Collections;
import java.util.Comparator;
import java.util.Date;
import java.util.Iterator;
@@ -46,6 +47,7 @@
import org.apache.jackrabbit.oak.plugins.document.ClusterNodeInfo;
import org.apache.jackrabbit.oak.plugins.document.ClusterNodeInfoDocument;
import org.apache.jackrabbit.oak.plugins.document.Collection;
import org.apache.jackrabbit.oak.plugins.document.Document;
import org.apache.jackrabbit.oak.plugins.document.DocumentNodeStoreBuilder;
import org.apache.jackrabbit.oak.plugins.document.DocumentStore;
import org.apache.jackrabbit.oak.plugins.document.DocumentStoreException;
@@ -54,6 +56,8 @@
import org.apache.jackrabbit.oak.plugins.document.Revision;
import org.apache.jackrabbit.oak.plugins.document.RevisionVector;
import org.apache.jackrabbit.oak.plugins.document.StableRevisionComparator;
import org.apache.jackrabbit.oak.plugins.document.UpdateOp;
import org.apache.jackrabbit.oak.plugins.document.UpdateOp.Key;
import org.apache.jackrabbit.oak.spi.toggle.Feature;
import org.apache.jackrabbit.oak.stats.Clock;
import org.jetbrains.annotations.NotNull;
@@ -274,6 +278,73 @@ private static String diagsForEntry(Map.Entry<String, PropertyStats> member) {
}
}

/**
* @return cluster id from the first revision found in op, {@code -1} otherwise
*/
public static int extractClusterId(UpdateOp op) {
for (Key key : op.getChanges().keySet()) {
if (key.getRevision() != null) {
return key.getRevision().getClusterId();
}
}
return -1;
}
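
For illustration (an editor's sketch, not part of the patch): an op whose first change is keyed by a revision yields that revision's cluster id; the document id and revision values below are made up.

UpdateOp op = new UpdateOp("1:/foo", false);                     // hypothetical id
op.setMapEntry(":childOrder", new Revision(1234L, 0, 3), "bar");
int clusterId = Utils.extractClusterId(op);                      // -> 3
// an op without any revision-keyed change yields -1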

/**
* Produce an {@link UpdateOp} suitable for shrinking branch revision entries for the given property in a {@link Document}.
*
* @param doc document to inspect for repeated branch commits
* @param propertName property to check for
Contributor:
Make it @param propertyName, please.

* @param revisionChecker filter for revisions (for instance, to check for cluster id)
* @return {@link UpdateOp} suitable for shrinking the document, or {@code null} if there is nothing to shrink
*/
public static @Nullable UpdateOp getShrinkOp(Document doc, String propertyName, Predicate<Revision> revisionChecker) {
Contributor:
If doc could be a NodeDocument instead of the generic Document some of those instanceof could be avoided...

Contributor Author:
I think we can do that once we use that from NodeDocumentStore, not DocumentStore...

Contributor Author:
@mbaedke - this is where we could check the feature flag for now...

Object t_bc = doc.get("_bc");
Object t_property = doc.get(propertyName);
Contributor:
I would use camelCase.

if (t_bc instanceof Map && t_property instanceof Map) {
@SuppressWarnings("unchecked")
Map<Revision, String> _bc = (Map<Revision, String>)t_bc;
@SuppressWarnings("unchecked")
Map<Revision, String> pMap = (Map<Revision, String>)t_property;
List<Revision> revs = new ArrayList<>();
for (Map.Entry<Revision, String> en : pMap.entrySet()) {
Revision r = en.getKey();
if (revisionChecker.apply(r)) {
String bcv = _bc.get(r);
if ("true".equals(bcv)) {
revs.add(r);
}
}
}
// sort by age
Collections.sort(revs, new Comparator<Revision>() {
Contributor:
wondering if there isn't such a Comparator in oak land already?

Contributor Author:
Not in Revision, as far as I can tell. I wanted a comparator that sorts by clusterId first; we may not need this if we always filter by cluster id though.

@Override
public int compare(Revision r1, Revision r2) {
if (r1.getClusterId() != r2.getClusterId()) {
return r1.getClusterId() - r2.getClusterId();
} else if (r1.getTimestamp() != r2.getTimestamp()) {
return r1.getTimestamp() > r2.getTimestamp() ? 1 : -1;
} else {
return r1.getCounter() - r2.getCounter();
}
}});
Comment on lines +320 to +330
Contributor:
Suggested change
Collections.sort(revs, new Comparator<Revision>() {
@Override
public int compare(Revision r1, Revision r2) {
if (r1.getClusterId() != r2.getClusterId()) {
return r1.getClusterId() - r2.getClusterId();
} else if (r1.getTimestamp() != r2.getTimestamp()) {
return r1.getTimestamp() > r2.getTimestamp() ? 1 : -1;
} else {
return r1.getCounter() - r2.getCounter();
}
}});
revs.sort((c1, c2) -> Comparator.comparing(Revision::getClusterId).thenComparing(Revision::getTimestamp).thenComparing(Revision::getCounter).compare(c1, c2));
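
As a side note (a sketch, not part of the review thread): the same ordering can be written without the wrapping lambda by using the primitive-specialised comparator factories.

revs.sort(Comparator.comparingInt(Revision::getClusterId)
        .thenComparingLong(Revision::getTimestamp)
        .thenComparingInt(Revision::getCounter));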


UpdateOp clean = new UpdateOp(doc.getId(), false);
Revision last = null;
for (Revision r : revs) {
if (last != null) {
if (last.getClusterId() == r.getClusterId()) {
clean.removeMapEntry(propertyName, last);
}
}
last = r;
}
Comment on lines +334 to +341
Contributor:
  • this seems to be a bit broader GC than expected. It deletes basically all older revisions of the same clusterId. That seems fine - but at that point I'm wondering why restrict it to only branch commits - i.e. why specifically only branch commits. Which would lead to the assumption that the idea was to only remove "overwritten branch commits"?
  • is the clusterId check here still necessary given the predicate check introduced?
  • this doesn't take the usual 24h GC max time nor active checkpoints into account.

Contributor:
PS:

  • it doesn't take late-writes into account (i.e. where the traversed state isn't equal to the head state)

Contributor Author (@reschke, Feb 21, 2024):
  • all older revisions that are branch commits (filtered earlier in the code); is there more that we can check? That would require _revisions, but those might be in a different document, right?
  • clusterid check - yes, unless we guarantee that the predicate will filter by id
  • ack - suggestions?

Contributor:
some ideas:

  • we could restrict it to "overwritten unmerged branch commits": those we know are garbage in any case
  • but that might still leave us with a too large doc/prop. we could then try to get the traversed state from "24h ago or the oldest checkpoint" (whichever is older) - then delete anything older than that
  • but that still might leave us with a too large doc/prop. then we might have to do an impromptu split and move anything younger than the previous into a split doc ...

Contributor:
those 3 cases could be .. test cases .. :)

Contributor:
regarding

get the traversed state from "24h ago or the oldest checkpoint" (whichever is older)

that might actually be a tricky thing to achieve - and I believe we might not have done that properly in the DetailedGC effort so far. I think we might need an actual checkpoint that corresponds to "24h ago"

Contributor:
I think we might need an actual checkpoint that corresponds to "24h ago"

... or maybe not a physical checkpoint, but a root revision that corresponds to reading 24h ago : which we might substitute with corresponding revisions (with timestamp 24h minus 1 millisecond) for each known clusterId ... or something like that ...

Contributor:
we might not have done that properly in the DetailedGC effort so far

... taking that back .. the difference between DetailedGC and this runtime GC case here is : in DetailedGC we're only looking at documents that have not been modified for 24+ hours. That means, reading their traversed state with headRevision of "now" is fine. But in this runtime GC case here, that is not fine (as we need to respect those 24+ hours worth of MVCC)
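
A minimal sketch (an editor's illustration, not part of the patch) of how the revision predicate passed to getShrinkOp could at least respect the 24-hour window discussed above; the clock source, the cutoff handling and the property name are assumptions:

// hypothetical: only shrink entries of our own cluster id that are older than 24 hours
long cutoff = clock.getTime() - TimeUnit.HOURS.toMillis(24);   // 'clock' as supplied by the store
UpdateOp shrink = Utils.getShrinkOp(doc, ":childOrder",
        r -> r.getClusterId() == clusterId && r.getTimestamp() < cutoff);
// note: this still ignores active checkpoints and late writes, as pointed out above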

return clean.hasChanges() ? clean : null;
} else {
return null;
}
}

/**
* List of property names that are system-defined by JCR and thus do not
* need to be redacted (to be expanded later)