datastax
diff --git a/.idea/libraries/Maven__org_scala_lang_scala_library_2_11_8.xml b/.idea/libraries/Maven__org_scala_lang_scala_library_2_11_8.xml
Lines changed: 0 additions & 23 deletions
diff --git a/README.md b/README.md
Lines changed: 2 additions & 6 deletions
diff --git a/pom.xml b/pom.xml
Lines changed: 1 addition & 1 deletion
diff --git a/src/main/java/datastax/astra/migrate/AbstractJobSession.java b/src/main/java/datastax/astra/migrate/AbstractJobSession.java
Lines changed: 22 additions & 25 deletions
diff --git a/src/main/java/datastax/astra/migrate/CopyJobSession.java b/src/main/java/datastax/astra/migrate/CopyJobSession.java
Lines changed: 6 additions & 10 deletions
diff --git a/src/main/java/datastax/astra/migrate/DiffJobSession.java b/src/main/java/datastax/astra/migrate/DiffJobSession.java
Lines changed: 7 additions & 13 deletions
@@ -25,8 +25,6 @@ tar -xvzf <spark downloaded file name>
 ```
 ./spark-submit --properties-file sparkConf.properties /
 --master "local[*]" /
---conf spark.migrate.source.minPartition=-9223372036854775808 /
---conf spark.migrate.source.maxPartition=9223372036854775807 /
 --class datastax.astra.migrate.Migrate cassandra-data-migrator-1.x.jar &> logfile_name.txt
 ```
 
@@ -40,8 +38,6 @@ Note: Above command also generates a log file `logfile_name.txt` to avoid log ou
 ```
 ./spark-submit --properties-file sparkConf.properties /
 --master "local[*]" /
---conf spark.migrate.source.minPartition=-9223372036854775808 /
---conf spark.migrate.source.maxPartition=9223372036854775807 /
 --class datastax.astra.migrate.DiffData cassandra-data-migrator-1.x.jar &> logfile_name.txt
 ```
 
@@ -60,8 +56,8 @@ Note: Above command also generates a log file `logfile_name.txt` to avoid log ou
 - Enable/disable this feature using one or both of the below setting in the config file
 
 ```
-spark.migrate.destination.autocorrect.missing                   true|false
-spark.migrate.destination.autocorrect.mismatch                  true|false
+spark.destination.autocorrect.missing                   true|false
+spark.destination.autocorrect.mismatch                  true|false
 ```
 
 # Additional features
 
@@ -3,7 +3,7 @@
 
   <groupId>datastax.astra.migrate</groupId>
   <artifactId>cassandra-data-migrator</artifactId>
-  <version>1.0</version>
+  <version>1.2</version>
   <packaging>jar</packaging>
 
   <properties>
 
@@ -34,6 +34,7 @@ public abstract class AbstractJobSession {
 
     protected CqlSession sourceSession;
     protected CqlSession astraSession;
+    protected List<MigrateDataType> selectColTypes = new ArrayList<MigrateDataType>();
     protected List<MigrateDataType> idColTypes = new ArrayList<MigrateDataType>();
 
     protected Integer batchSize = 1;
@@ -47,7 +48,6 @@ public abstract class AbstractJobSession {
     protected List<Integer> writeTimeStampCols = new ArrayList<Integer>();
     protected List<Integer> ttlCols = new ArrayList<Integer>();
     protected Boolean isCounterTable;
-    protected Integer counterDeltaMaxIndex = 0;
 
     protected String sourceKeyspaceTable;
     protected String astraKeyspaceTable;
@@ -58,22 +58,22 @@ protected AbstractJobSession(CqlSession sourceSession, CqlSession astraSession,
         this.sourceSession = sourceSession;
         this.astraSession = astraSession;
 
-        batchSize = new Integer(sparkConf.get("spark.migrate.batchSize", "1"));
-        printStatsAfter = new Integer(sparkConf.get("spark.migrate.printStatsAfter", "100000"));
+        batchSize = new Integer(sparkConf.get("spark.batchSize", "1"));
+        printStatsAfter = new Integer(sparkConf.get("spark.printStatsAfter", "100000"));
         if (printStatsAfter < 1) {
             printStatsAfter = 100000;
         }
 
-        readLimiter = RateLimiter.create(new Integer(sparkConf.get("spark.migrate.readRateLimit", "20000")));
-        writeLimiter = RateLimiter.create(new Integer(sparkConf.get("spark.migrate.writeRateLimit", "40000")));
-        maxRetries = Integer.parseInt(sparkConf.get("spark.migrate.maxRetries", "10"));
+        readLimiter = RateLimiter.create(new Integer(sparkConf.get("spark.readRateLimit", "20000")));
+        writeLimiter = RateLimiter.create(new Integer(sparkConf.get("spark.writeRateLimit", "40000")));
+        maxRetries = Integer.parseInt(sparkConf.get("spark.maxRetries", "10"));
 
-        sourceKeyspaceTable = sparkConf.get("spark.migrate.source.keyspaceTable");
-        astraKeyspaceTable = sparkConf.get("spark.migrate.destination.keyspaceTable");
+        sourceKeyspaceTable = sparkConf.get("spark.source.keyspaceTable");
+        astraKeyspaceTable = sparkConf.get("spark.destination.keyspaceTable");
 
-        isPreserveTTLWritetime = Boolean.parseBoolean(sparkConf.get("spark.migrate.preserveTTLWriteTime", "false"));
+        isPreserveTTLWritetime = Boolean.parseBoolean(sparkConf.get("spark.preserveTTLWriteTime", "false"));
         if (isPreserveTTLWritetime) {
-            String ttlColsStr = sparkConf.get("spark.migrate.source.ttl.cols");
+            String ttlColsStr = sparkConf.get("spark.source.ttl.cols");
             if (null != ttlColsStr && ttlColsStr.trim().length() > 0) {
                 for (String ttlCol : ttlColsStr.split(",")) {
                     ttlCols.add(Integer.parseInt(ttlCol));
@@ -82,11 +82,11 @@ protected AbstractJobSession(CqlSession sourceSession, CqlSession astraSession,
         }
 
         writeTimeStampFilter = Boolean
-                .parseBoolean(sparkConf.get("spark.migrate.source.writeTimeStampFilter", "false"));
+                .parseBoolean(sparkConf.get("spark.source.writeTimeStampFilter", "false"));
         // batchsize set to 1 if there is a writeFilter
         if (writeTimeStampFilter) {
             batchSize = 1;
-            String writeTimestampColsStr = sparkConf.get("spark.migrate.source.writeTimeStampFilter.cols");
+            String writeTimestampColsStr = sparkConf.get("spark.source.writeTimeStampFilter.cols");
             if (null != writeTimestampColsStr && writeTimestampColsStr.trim().length() > 0) {
                 for (String writeTimeStampCol : writeTimestampColsStr.split(",")) {
                     writeTimeStampCols.add(Integer.parseInt(writeTimeStampCol));
@@ -95,12 +95,12 @@ protected AbstractJobSession(CqlSession sourceSession, CqlSession astraSession,
         }
 
         String minWriteTimeStampFilterStr =
-                sparkConf.get("spark.migrate.source.minWriteTimeStampFilter", "0");
+                sparkConf.get("spark.source.minWriteTimeStampFilter", "0");
         if (null != minWriteTimeStampFilterStr && minWriteTimeStampFilterStr.trim().length() > 1) {
             minWriteTimeStampFilter = Long.parseLong(minWriteTimeStampFilterStr);
         }
         String maxWriteTimeStampFilterStr =
-                sparkConf.get("spark.migrate.source.maxWriteTimeStampFilter", "0");
+                sparkConf.get("spark.source.maxWriteTimeStampFilter", "0");
         if (null != maxWriteTimeStampFilterStr && maxWriteTimeStampFilterStr.trim().length() > 1) {
             maxWriteTimeStampFilter = Long.parseLong(maxWriteTimeStampFilterStr);
         }
@@ -115,18 +115,15 @@ protected AbstractJobSession(CqlSession sourceSession, CqlSession astraSession,
         logger.info(" DEFAULT -- isPreserveTTLWritetime: " + isPreserveTTLWritetime);
         logger.info(" DEFAULT -- TTLCols: " + ttlCols);
 
-        hasRandomPartitioner = Boolean.parseBoolean(sparkConf.get("spark.migrate.source.hasRandomPartitioner", "false"));
+        hasRandomPartitioner = Boolean.parseBoolean(sparkConf.get("spark.source.hasRandomPartitioner", "false"));
 
-        isCounterTable = Boolean.parseBoolean(sparkConf.get("spark.migrate.source.counterTable", "false"));
+        isCounterTable = Boolean.parseBoolean(sparkConf.get("spark.counterTable", "false"));
+        selectColTypes = getTypes(sparkConf.get("spark.diff.select.types"));
+        String partionKey = sparkConf.get("spark.query.cols.partitionKey");
+        String idCols = sparkConf.get("spark.query.cols.id");
+        idColTypes = getTypes(sparkConf.get("spark.query.cols.id.types"));
 
-        counterDeltaMaxIndex = Integer
-                .parseInt(sparkConf.get("spark.migrate.source.counterTable.update.max.counter.index", "0"));
-
-        String partionKey = sparkConf.get("spark.migrate.query.cols.partitionKey");
-        String idCols = sparkConf.get("spark.migrate.query.cols.id");
-        idColTypes = getTypes(sparkConf.get("spark.migrate.query.cols.id.types"));
-
-        String selectCols = sparkConf.get("spark.migrate.query.cols.select");
+        String selectCols = sparkConf.get("spark.query.cols.select");
 
         String idBinds = "";
         int count = 1;
@@ -139,7 +136,7 @@ protected AbstractJobSession(CqlSession sourceSession, CqlSession astraSession,
             count++;
         }
 
-        sourceSelectCondition = sparkConf.get("spark.migrate.query.cols.select.condition", "");
+        sourceSelectCondition = sparkConf.get("spark.query.cols.select.condition", "");
         sourceSelectStatement = sourceSession.prepare(
                 "select " + selectCols + " from " + sourceKeyspaceTable + " where token(" + partionKey.trim()
                         + ") >= ? and token(" + partionKey.trim() + ") <= ?  " + sourceSelectCondition + " ALLOW FILTERING");
 
@@ -40,8 +40,8 @@ public static CopyJobSession getInstance(CqlSession sourceSession, CqlSession as
     protected CopyJobSession(CqlSession sourceSession, CqlSession astraSession, SparkConf sparkConf) {
         super(sourceSession, astraSession, sparkConf);
 
-        String insertCols = sparkConf.get("spark.migrate.query.cols.insert");
-        insertColTypes = getTypes(sparkConf.get("spark.migrate.query.cols.insert.types"));
+        String insertCols = sparkConf.get("spark.query.cols.insert");
+        insertColTypes = getTypes(sparkConf.get("spark.query.cols.insert.types"));
         String insertBinds = "";
         int count = 1;
         for (String str : insertCols.split(",")) {
@@ -54,12 +54,12 @@ protected CopyJobSession(CqlSession sourceSession, CqlSession astraSession, Spar
         }
 
         if (isCounterTable) {
-            String updateSelectMappingStr = sparkConf.get("spark.migrate.source.counterTable.update.select.index", "0");
+            String updateSelectMappingStr = sparkConf.get("spark.counterTable.cql.index", "0");
             for (String updateSelectIndex : updateSelectMappingStr.split(",")) {
                 updateSelectMapping.add(Integer.parseInt(updateSelectIndex));
             }
 
-            String counterTableUpdate = sparkConf.get("spark.migrate.source.counterTable.update.cql");
+            String counterTableUpdate = sparkConf.get("spark.counterTable.cql");
             astraInsertStatement = astraSession.prepare(counterTableUpdate);
         } else {
             if (isPreserveTTLWritetime) {
@@ -181,8 +181,8 @@ public BoundStatement bindInsert(PreparedStatement insertStatement, Row sourceRo
             for (int index = 0; index < insertColTypes.size(); index++) {
                 MigrateDataType dataType = insertColTypes.get(index);
                 // compute the counter delta if reading from astra for the difference
-                if (astraRow != null && isCounterTable && index <= counterDeltaMaxIndex) {
-                    boundInsertStatement = boundInsertStatement.set(index, getCounterDelta(sourceRow.getLong(updateSelectMapping.get(index)), astraRow.getLong(updateSelectMapping.get(index))), Long.class);
+                if (astraRow != null && index < (selectColTypes.size() - idColTypes.size())) {
+                    boundInsertStatement = boundInsertStatement.set(index, (sourceRow.getLong(updateSelectMapping.get(index)) - astraRow.getLong(updateSelectMapping.get(index))), Long.class);
                 } else {
                     boundInsertStatement = boundInsertStatement.set(index, getData(dataType, updateSelectMapping.get(index), sourceRow), dataType.typeClass);
                 }
@@ -217,8 +217,4 @@ public BoundStatement bindInsert(PreparedStatement insertStatement, Row sourceRo
         return boundInsertStatement;
     }
 
-    public Long getCounterDelta(Long sourceRow, Long astraRow) {
-        return sourceRow - astraRow;
-    }
-
 }
@@ -15,14 +15,6 @@
 import java.util.stream.IntStream;
 import java.util.stream.StreamSupport;
 
-/*
-(
-    data_id text,
-    cylinder text,
-    value blob,
-    PRIMARY KEY (data_id, cylinder)
-)
- */
 public class DiffJobSession extends CopyJobSession {
 
     public static Logger logger = Logger.getLogger(DiffJobSession.class);
@@ -36,7 +28,6 @@ public class DiffJobSession extends CopyJobSession {
     private AtomicLong validCounter = new AtomicLong(0);
     private AtomicLong skippedCounter = new AtomicLong(0);
 
-    protected List<MigrateDataType> selectColTypes = new ArrayList<MigrateDataType>();
     protected Boolean autoCorrectMissing = false;
     protected Boolean autoCorrectMismatch = false;
 
@@ -55,9 +46,8 @@ public static DiffJobSession getInstance(CqlSession sourceSession, CqlSession as
     private DiffJobSession(CqlSession sourceSession, CqlSession astraSession, SparkConf sparkConf) {
         super(sourceSession, astraSession, sparkConf);
 
-        selectColTypes = getTypes(sparkConf.get("spark.migrate.diff.select.types"));
-        autoCorrectMissing = Boolean.parseBoolean(sparkConf.get("spark.migrate.destination.autocorrect.missing", "false"));
-        autoCorrectMismatch = Boolean.parseBoolean(sparkConf.get("spark.migrate.destination.autocorrect.mismatch", "false"));
+        autoCorrectMissing = Boolean.parseBoolean(sparkConf.get("spark.destination.autocorrect.missing", "false"));
+        autoCorrectMismatch = Boolean.parseBoolean(sparkConf.get("spark.destination.autocorrect.mismatch", "false"));
     }
 
     public void getDataAndDiff(BigInteger min, BigInteger max) {
@@ -142,7 +132,11 @@ private void diff(Row sourceRow, Row astraRow) {
             logger.error("Data mismatch found -  Key: " + getKey(sourceRow) + " Data: " + diffData);
 
             if (autoCorrectMismatch) {
-                astraSession.execute(bindInsert(astraInsertStatement, sourceRow, null));
+                if (isCounterTable) {
+                    astraSession.execute(bindInsert(astraInsertStatement, sourceRow, astraRow));
+                } else {
+                    astraSession.execute(bindInsert(astraInsertStatement, sourceRow, null));
+                }
                 correctedMismatchCounter.incrementAndGet();
                 logger.error("Corrected mismatch data in Astra: " + getKey(sourceRow));
             }