-
Notifications
You must be signed in to change notification settings - Fork 40
Optimize mutations based on the storage’s mutation atomicity unit in Consensus Commit #2807
New issue
Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.
By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.
Already on GitHub? Sign in to your account
Changes from all commits
File filter
Filter by extension
Conversations
Jump to
Diff view
Diff view
There are no files selected for viewing
| Original file line number | Diff line number | Diff line change |
|---|---|---|
|
|
@@ -2,9 +2,9 @@ | |
|
|
||
| import static com.google.common.base.Preconditions.checkNotNull; | ||
|
|
||
| import com.google.common.collect.ImmutableList; | ||
| import com.google.errorprone.annotations.concurrent.LazyInit; | ||
| import com.scalar.db.api.DistributedStorage; | ||
| import com.scalar.db.api.Mutation; | ||
| import com.scalar.db.api.TransactionState; | ||
| import com.scalar.db.common.CoreError; | ||
| import com.scalar.db.exception.storage.ExecutionException; | ||
|
|
@@ -36,6 +36,7 @@ public class CommitHandler { | |
| protected final Coordinator coordinator; | ||
| private final TransactionTableMetadataManager tableMetadataManager; | ||
| private final ParallelExecutor parallelExecutor; | ||
| private final MutationsGrouper mutationsGrouper; | ||
| protected final boolean coordinatorWriteOmissionOnReadOnlyEnabled; | ||
|
|
||
| @LazyInit @Nullable private BeforePreparationSnapshotHook beforePreparationSnapshotHook; | ||
|
|
@@ -46,11 +47,13 @@ public CommitHandler( | |
| Coordinator coordinator, | ||
| TransactionTableMetadataManager tableMetadataManager, | ||
| ParallelExecutor parallelExecutor, | ||
| MutationsGrouper mutationsGrouper, | ||
| boolean coordinatorWriteOmissionOnReadOnlyEnabled) { | ||
| this.storage = checkNotNull(storage); | ||
| this.coordinator = checkNotNull(coordinator); | ||
| this.tableMetadataManager = checkNotNull(tableMetadataManager); | ||
| this.parallelExecutor = checkNotNull(parallelExecutor); | ||
| this.mutationsGrouper = checkNotNull(mutationsGrouper); | ||
| this.coordinatorWriteOmissionOnReadOnlyEnabled = coordinatorWriteOmissionOnReadOnlyEnabled; | ||
| } | ||
|
|
||
|
|
@@ -199,12 +202,11 @@ public void prepareRecords(Snapshot snapshot) throws PreparationException { | |
| PrepareMutationComposer composer = | ||
| new PrepareMutationComposer(snapshot.getId(), tableMetadataManager); | ||
| snapshot.to(composer); | ||
| PartitionedMutations mutations = new PartitionedMutations(composer.get()); | ||
| List<List<Mutation>> groupedMutations = mutationsGrouper.groupMutations(composer.get()); | ||
|
|
||
| ImmutableList<PartitionedMutations.Key> orderedKeys = mutations.getOrderedKeys(); | ||
| List<ParallelExecutorTask> tasks = new ArrayList<>(orderedKeys.size()); | ||
| for (PartitionedMutations.Key key : orderedKeys) { | ||
| tasks.add(() -> storage.mutate(mutations.get(key))); | ||
| List<ParallelExecutorTask> tasks = new ArrayList<>(groupedMutations.size()); | ||
| for (List<Mutation> mutations : groupedMutations) { | ||
| tasks.add(() -> storage.mutate(mutations)); | ||
| } | ||
| parallelExecutor.prepareRecords(tasks, snapshot.getId()); | ||
| } catch (NoMutationException e) { | ||
|
|
@@ -252,12 +254,11 @@ public void commitRecords(Snapshot snapshot) { | |
| CommitMutationComposer composer = | ||
| new CommitMutationComposer(snapshot.getId(), tableMetadataManager); | ||
| snapshot.to(composer); | ||
| PartitionedMutations mutations = new PartitionedMutations(composer.get()); | ||
| List<List<Mutation>> groupedMutations = mutationsGrouper.groupMutations(composer.get()); | ||
|
Collaborator
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Split the mutations for commit-records. |
||
|
|
||
| ImmutableList<PartitionedMutations.Key> orderedKeys = mutations.getOrderedKeys(); | ||
| List<ParallelExecutorTask> tasks = new ArrayList<>(orderedKeys.size()); | ||
| for (PartitionedMutations.Key key : orderedKeys) { | ||
| tasks.add(() -> storage.mutate(mutations.get(key))); | ||
| List<ParallelExecutorTask> tasks = new ArrayList<>(groupedMutations.size()); | ||
| for (List<Mutation> mutations : groupedMutations) { | ||
| tasks.add(() -> storage.mutate(mutations)); | ||
| } | ||
| parallelExecutor.commitRecords(tasks, snapshot.getId()); | ||
| } catch (Exception e) { | ||
|
|
@@ -300,12 +301,11 @@ public void rollbackRecords(Snapshot snapshot) { | |
| RollbackMutationComposer composer = | ||
| new RollbackMutationComposer(snapshot.getId(), storage, tableMetadataManager); | ||
| snapshot.to(composer); | ||
| PartitionedMutations mutations = new PartitionedMutations(composer.get()); | ||
| List<List<Mutation>> groupedMutations = mutationsGrouper.groupMutations(composer.get()); | ||
|
Collaborator
Author
There was a problem hiding this comment. Choose a reason for hiding this commentThe reason will be displayed to describe this comment to others. Learn more. Split the mutations for rollback-records. |
||
|
|
||
| ImmutableList<PartitionedMutations.Key> orderedKeys = mutations.getOrderedKeys(); | ||
| List<ParallelExecutorTask> tasks = new ArrayList<>(orderedKeys.size()); | ||
| for (PartitionedMutations.Key key : orderedKeys) { | ||
| tasks.add(() -> storage.mutate(mutations.get(key))); | ||
| List<ParallelExecutorTask> tasks = new ArrayList<>(groupedMutations.size()); | ||
| for (List<Mutation> mutations : groupedMutations) { | ||
| tasks.add(() -> storage.mutate(mutations)); | ||
| } | ||
| parallelExecutor.rollbackRecords(tasks, snapshot.getId()); | ||
| } catch (Exception e) { | ||
|
|
||
| Original file line number | Diff line number | Diff line change |
|---|---|---|
| @@ -0,0 +1,127 @@ | ||
package com.scalar.db.transaction.consensuscommit;

import com.scalar.db.api.Mutation;
import com.scalar.db.api.StorageInfo;
import com.scalar.db.common.StorageInfoProvider;
import com.scalar.db.exception.storage.ExecutionException;
import com.scalar.db.io.Key;
import java.util.ArrayList;
import java.util.Collection;
import java.util.LinkedHashMap;
import java.util.List;
import java.util.Map;
import java.util.Objects;
import java.util.Optional;
import java.util.stream.Collectors;
import javax.annotation.Nullable;
import javax.annotation.concurrent.ThreadSafe;

/**
 * Groups mutations into batches that the underlying storage can apply atomically, based on each
 * storage's mutation atomicity unit (record, partition, table, namespace, or whole storage) and
 * its maximum atomic mutation count.
 */
@ThreadSafe
public class MutationsGrouper {

  private final StorageInfoProvider storageInfoProvider;

  public MutationsGrouper(StorageInfoProvider storageInfoProvider) {
    this.storageInfoProvider = storageInfoProvider;
  }

  /**
   * Groups the given mutations into batches. Mutations that share the same atomicity scope are
   * placed in the same batch, and each batch is capped at the storage's maximum atomic mutation
   * count. Within each group, the original iteration order of the mutations is preserved.
   *
   * @param mutations the mutations to group
   * @return a list of batches, each of which can be applied atomically by its storage
   * @throws ExecutionException if retrieving the storage info for a namespace fails
   */
  public List<List<Mutation>> groupMutations(Collection<Mutation> mutations)
      throws ExecutionException {
    // Group mutations by their storage info and atomicity unit. A LinkedHashMap keeps the groups
    // in first-seen order so the resulting batch order is deterministic.
    Map<MutationGroup, List<List<Mutation>>> groupToBatches = new LinkedHashMap<>();

    for (Mutation mutation : mutations) {
      assert mutation.forNamespace().isPresent();
      StorageInfo storageInfo = storageInfoProvider.getStorageInfo(mutation.forNamespace().get());

      MutationGroup group = new MutationGroup(mutation, storageInfo);
      List<List<Mutation>> batches = groupToBatches.computeIfAbsent(group, g -> new ArrayList<>());
      int maxCount = group.storageInfo.getMaxAtomicMutationsCount();

      if (batches.isEmpty() || batches.get(batches.size() - 1).size() >= maxCount) {
        // If the last batch is full or there are no batches yet, start a new batch
        batches.add(new ArrayList<>());
      }

      batches.get(batches.size() - 1).add(mutation);
    }

    // Flatten the grouped mutations into a single list of batches
    return groupToBatches.values().stream().flatMap(List::stream).collect(Collectors.toList());
  }

  /**
   * A grouping key for mutations. Two mutations fall into the same group when they target the
   * same storage and agree on every component relevant to the storage's mutation atomicity unit.
   * Components coarser than the atomicity unit are left null so they do not participate in
   * equality or hashing.
   */
  private static class MutationGroup {
    public final StorageInfo storageInfo;
    @Nullable public final String namespace;
    @Nullable public final String table;
    @Nullable public final Key partitionKey;
    @Nullable public final Optional<Key> clusteringKey;

    private MutationGroup(Mutation mutation, StorageInfo storageInfo) {
      assert mutation.forNamespace().isPresent() && mutation.forTable().isPresent();

      String namespace = null;
      String table = null;
      Key partitionKey = null;
      Optional<Key> clusteringKey = null;

      // Intentional fall-through: each finer atomicity unit includes every component of the
      // coarser ones (e.g. RECORD needs the clustering key, partition key, table, and namespace;
      // NAMESPACE needs only the namespace).
      switch (storageInfo.getMutationAtomicityUnit()) {
        case RECORD:
          clusteringKey = mutation.getClusteringKey();
          // fall through
        case PARTITION:
          partitionKey = mutation.getPartitionKey();
          // fall through
        case TABLE:
          table = mutation.forTable().get();
          // fall through
        case NAMESPACE:
          namespace = mutation.forNamespace().get();
          // fall through
        case STORAGE:
          break;
        default:
          throw new AssertionError(
              "Unknown mutation atomicity unit: " + storageInfo.getMutationAtomicityUnit());
      }

      this.storageInfo = storageInfo;
      this.namespace = namespace;
      this.table = table;
      this.partitionKey = partitionKey;
      this.clusteringKey = clusteringKey;
    }

    @Override
    public boolean equals(Object o) {
      if (this == o) {
        return true;
      }
      if (!(o instanceof MutationGroup)) {
        return false;
      }
      MutationGroup that = (MutationGroup) o;
      return Objects.equals(storageInfo.getStorageName(), that.storageInfo.getStorageName())
          && Objects.equals(namespace, that.namespace)
          && Objects.equals(table, that.table)
          && Objects.equals(partitionKey, that.partitionKey)
          && Objects.equals(clusteringKey, that.clusteringKey);
    }

    @Override
    public int hashCode() {
      return Objects.hash(
          storageInfo.getStorageName(), namespace, table, partitionKey, clusteringKey);
    }
  }
}
This file was deleted.
There was a problem hiding this comment.
Choose a reason for hiding this comment
The reason will be displayed to describe this comment to others. Learn more.
Split the mutations for prepare-records.