
Commit 525dc8a

Removed functionality related to retry (#272)
1 parent 3a3bde3 commit 525dc8a

8 files changed: +160 -251 lines

src/main/java/com/datastax/cdm/feature/Guardrail.java

Lines changed: 1 addition & 1 deletion
@@ -100,7 +100,7 @@ private Map<String,Integer> check(Map<String,Integer> currentChecks, int targetI
 int colSize = targetTable.byteCount(targetIndex, targetValue);
 if (logTrace) logger.trace("Column {} at targetIndex {} has size {} bytes", targetTable.getColumnNames(false).get(targetIndex), targetIndex, colSize);
 if (colSize > colSizeInKB * BASE_FACTOR) {
-if (null==currentChecks) currentChecks = new HashMap();
+if (null==currentChecks) currentChecks = new HashMap<String,Integer>();
 currentChecks.put(targetTable.getColumnNames(false).get(targetIndex), colSize);
 }
 return currentChecks;
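
The only change in this file replaces a raw HashMap with an explicitly parameterized one. A stand-alone sketch of why the parameterized form is preferable; this is not CDM code, and the class name and values are illustrative:

import java.util.HashMap;
import java.util.Map;

public class RawTypeSketch {
    public static void main(String[] args) {
        Map<String, Integer> raw = new HashMap();                    // raw type: compiles, but with an "unchecked" warning
        Map<String, Integer> typed = new HashMap<String, Integer>(); // explicit type arguments, as in this commit
        Map<String, Integer> diamond = new HashMap<>();              // equivalent diamond form on Java 7+
        typed.put("column_a", 2048);
        diamond.put("column_b", 4096);
        System.out.println(typed + " " + diamond + " raw entries: " + raw.size());
    }
}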

src/main/java/com/datastax/cdm/job/AbstractJobSession.java

Lines changed: 0 additions & 2 deletions
@@ -67,10 +67,8 @@ protected AbstractJobSession(CqlSession originSession, CqlSession targetSession,

 rateLimiterOrigin = RateLimiter.create(propertyHelper.getInteger(KnownProperties.PERF_RATELIMIT_ORIGIN));
 rateLimiterTarget = RateLimiter.create(propertyHelper.getInteger(KnownProperties.PERF_RATELIMIT_TARGET));
-maxRetries = propertyHelper.getInteger(KnownProperties.MAX_RETRIES);
 trackRun = propertyHelper.getBoolean(KnownProperties.TRACK_RUN);

-logger.info("PARAM -- Max Retries: {}", maxRetries);
 logger.info("PARAM -- Partition file input: {}", partitionFileInput);
 logger.info("PARAM -- Partition file output: {}", partitionFileOutput);
 logger.info("PARAM -- Origin Rate Limit: {}", rateLimiterOrigin.getRate());

src/main/java/com/datastax/cdm/job/BaseJobSession.java

Lines changed: 0 additions & 1 deletion
@@ -46,7 +46,6 @@ public abstract class BaseJobSession {
 protected Map<Featureset, Feature> featureMap;
 protected RateLimiter rateLimiterOrigin;
 protected RateLimiter rateLimiterTarget;
-protected Integer maxRetries = 10;

 protected BaseJobSession(SparkConf sc) {
 propertyHelper.initializeSparkConf(sc);

src/main/java/com/datastax/cdm/job/CopyJobSession.java

Lines changed: 65 additions & 74 deletions
@@ -70,95 +70,86 @@ public synchronized void initCdmRun(Collection<SplitPartitions.Partition> parts,
 trackRunFeature.initCdmRun(parts, TrackRun.RUN_TYPE.MIGRATE);
 }

-public void getDataAndInsert(BigInteger min, BigInteger max) {
+private void getDataAndInsert(BigInteger min, BigInteger max) {
 ThreadContext.put(THREAD_CONTEXT_LABEL, getThreadLabel(min, max));
 logger.info("ThreadID: {} Processing min: {} max: {}", Thread.currentThread().getId(), min, max);
 if (trackRun)
 trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.STARTED);

 BatchStatement batch = BatchStatement.newInstance(BatchType.UNLOGGED);
-boolean done = false;
-int maxAttempts = maxRetries + 1;
 String guardrailCheck;
-for (int attempts = 1; attempts <= maxAttempts && !done; attempts++) {
-jobCounter.threadReset();
-
-try {
-OriginSelectByPartitionRangeStatement originSelectByPartitionRangeStatement = this.originSession
-.getOriginSelectByPartitionRangeStatement();
-targetUpsertStatement = this.targetSession.getTargetUpsertStatement();
-targetSelectByPKStatement = this.targetSession.getTargetSelectByPKStatement();
-ResultSet resultSet = originSelectByPartitionRangeStatement
-.execute(originSelectByPartitionRangeStatement.bind(min, max));
-Collection<CompletionStage<AsyncResultSet>> writeResults = new ArrayList<>();
-
-for (Row originRow : resultSet) {
-rateLimiterOrigin.acquire(1);
-jobCounter.threadIncrement(JobCounter.CounterType.READ);
-
-Record record = new Record(pkFactory.getTargetPK(originRow), originRow, null);
-if (originSelectByPartitionRangeStatement.shouldFilterRecord(record)) {
-jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
-continue;
-}
-
-for (Record r : pkFactory.toValidRecordList(record)) {
-if (guardrailEnabled) {
-guardrailCheck = guardrailFeature.guardrailChecks(r);
-if (guardrailCheck != null && guardrailCheck != Guardrail.CLEAN_CHECK) {
-logger.error("Guardrails failed for PrimaryKey {}; {}", r.getPk(), guardrailCheck);
-jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
-continue;
-}
-}
+jobCounter.threadReset();
+
+try {
+OriginSelectByPartitionRangeStatement originSelectByPartitionRangeStatement = this.originSession
+.getOriginSelectByPartitionRangeStatement();
+targetUpsertStatement = this.targetSession.getTargetUpsertStatement();
+targetSelectByPKStatement = this.targetSession.getTargetSelectByPKStatement();
+ResultSet resultSet = originSelectByPartitionRangeStatement
+.execute(originSelectByPartitionRangeStatement.bind(min, max));
+Collection<CompletionStage<AsyncResultSet>> writeResults = new ArrayList<>();
+
+for (Row originRow : resultSet) {
+rateLimiterOrigin.acquire(1);
+jobCounter.threadIncrement(JobCounter.CounterType.READ);
+
+Record record = new Record(pkFactory.getTargetPK(originRow), originRow, null);
+if (originSelectByPartitionRangeStatement.shouldFilterRecord(record)) {
+jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
+continue;
+}

-BoundStatement boundUpsert = bind(r);
-if (null == boundUpsert) {
-jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED); // TODO: this previously
-// skipped, why not errCnt?
+for (Record r : pkFactory.toValidRecordList(record)) {
+if (guardrailEnabled) {
+guardrailCheck = guardrailFeature.guardrailChecks(r);
+if (guardrailCheck != null && guardrailCheck != Guardrail.CLEAN_CHECK) {
+logger.error("Guardrails failed for PrimaryKey {}; {}", r.getPk(), guardrailCheck);
+jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
 continue;
 }
+}

-rateLimiterTarget.acquire(1);
-batch = writeAsync(batch, writeResults, boundUpsert);
-jobCounter.threadIncrement(JobCounter.CounterType.UNFLUSHED);
-
-if (jobCounter.getCount(JobCounter.CounterType.UNFLUSHED) > fetchSize) {
-flushAndClearWrites(batch, writeResults);
-jobCounter.threadIncrement(JobCounter.CounterType.WRITE,
-jobCounter.getCount(JobCounter.CounterType.UNFLUSHED));
-jobCounter.threadReset(JobCounter.CounterType.UNFLUSHED);
-}
+BoundStatement boundUpsert = bind(r);
+if (null == boundUpsert) {
+jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED); // TODO: this previously
+// skipped, why not errCnt?
+continue;
 }
-}

-flushAndClearWrites(batch, writeResults);
-jobCounter.threadIncrement(JobCounter.CounterType.WRITE,
-jobCounter.getCount(JobCounter.CounterType.UNFLUSHED));
-jobCounter.threadReset(JobCounter.CounterType.UNFLUSHED);
-done = true;
-if (trackRun)
-trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.PASS);
-
-} catch (Exception e) {
-if (attempts == maxAttempts) {
-jobCounter.threadIncrement(JobCounter.CounterType.ERROR,
-jobCounter.getCount(JobCounter.CounterType.READ)
-- jobCounter.getCount(JobCounter.CounterType.WRITE)
-- jobCounter.getCount(JobCounter.CounterType.SKIPPED));
-if (trackRun)
-trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.FAIL);
-else
-logPartitionsInFile(partitionFileOutput, min, max);
+rateLimiterTarget.acquire(1);
+batch = writeAsync(batch, writeResults, boundUpsert);
+jobCounter.threadIncrement(JobCounter.CounterType.UNFLUSHED);
+
+if (jobCounter.getCount(JobCounter.CounterType.UNFLUSHED) > fetchSize) {
+flushAndClearWrites(batch, writeResults);
+jobCounter.threadIncrement(JobCounter.CounterType.WRITE,
+jobCounter.getCount(JobCounter.CounterType.UNFLUSHED));
+jobCounter.threadReset(JobCounter.CounterType.UNFLUSHED);
+}
 }
-logger.error("Error occurred during Attempt#: {}", attempts, e);
-logger.error("Error with PartitionRange -- ThreadID: {} Processing min: {} max: {} -- Attempt# {}",
-Thread.currentThread().getId(), min, max, attempts);
-logger.error("Error stats " + jobCounter.getThreadCounters(false));
-} finally {
-jobCounter.globalIncrement();
-printCounts(false);
 }
+
+flushAndClearWrites(batch, writeResults);
+jobCounter.threadIncrement(JobCounter.CounterType.WRITE,
+jobCounter.getCount(JobCounter.CounterType.UNFLUSHED));
+jobCounter.threadReset(JobCounter.CounterType.UNFLUSHED);
+if (trackRun)
+trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.PASS);
+
+} catch (Exception e) {
+jobCounter.threadIncrement(JobCounter.CounterType.ERROR,
+jobCounter.getCount(JobCounter.CounterType.READ) - jobCounter.getCount(JobCounter.CounterType.WRITE)
+- jobCounter.getCount(JobCounter.CounterType.SKIPPED));
+if (trackRun)
+trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.FAIL);
+else
+logPartitionsInFile(partitionFileOutput, min, max);
+logger.error("Error with PartitionRange -- ThreadID: {} Processing min: {} max: {}",
+Thread.currentThread().getId(), min, max);
+logger.error("Error stats " + jobCounter.getThreadCounters(false));
+} finally {
+jobCounter.globalIncrement();
+printCounts(false);
 }
 }
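
The structural change above is the removal of the for (attempts) retry loop: each partition range is now processed exactly once, and a failure is either recorded via trackRun or appended to the partition output file so a later run can pick it up. A minimal stand-alone sketch of that single-attempt pattern, with hypothetical names standing in for the CDM classes:

import java.math.BigInteger;
import java.util.ArrayList;
import java.util.List;

public class SingleAttemptSketch {

    // Stand-in for the per-partition work done by getDataAndInsert(min, max).
    static void processPartition(BigInteger min, BigInteger max) {
        if (min.signum() < 0) {                      // pretend that negative ranges fail
            throw new RuntimeException("simulated failure");
        }
        System.out.println("processed " + min + ".." + max);
    }

    public static void main(String[] args) {
        // Plays the role of trackRun / the partition output file: failed ranges are
        // recorded so a follow-up run can redo them, instead of retrying in-process.
        List<BigInteger[]> failed = new ArrayList<>();

        BigInteger[][] partitions = {
                { BigInteger.valueOf(-10), BigInteger.ZERO },
                { BigInteger.ONE, BigInteger.TEN }
        };

        for (BigInteger[] p : partitions) {
            try {
                processPartition(p[0], p[1]);        // single attempt, no retry loop
            } catch (Exception e) {
                failed.add(p);                       // record the range for a later re-run
                System.err.println("range " + p[0] + ".." + p[1] + " failed: " + e.getMessage());
            }
        }
        System.out.println("ranges to re-run: " + failed.size());
    }
}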

src/main/java/com/datastax/cdm/job/DiffJobSession.java

Lines changed: 68 additions & 75 deletions
@@ -125,91 +125,84 @@ public synchronized void initCdmRun(Collection<SplitPartitions.Partition> parts,
 trackRunFeature.initCdmRun(parts, TrackRun.RUN_TYPE.DIFF_DATA);
 }

-public void getDataAndDiff(BigInteger min, BigInteger max) {
+private void getDataAndDiff(BigInteger min, BigInteger max) {
 ThreadContext.put(THREAD_CONTEXT_LABEL, getThreadLabel(min, max));
 logger.info("ThreadID: {} Processing min: {} max: {}", Thread.currentThread().getId(), min, max);
 if (trackRun)
 trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.STARTED);

-boolean done = false;
 AtomicBoolean hasDiff = new AtomicBoolean(false);
-int maxAttempts = maxRetries + 1;
-for (int attempts = 1; attempts <= maxAttempts && !done; attempts++) {
-try {
-jobCounter.threadReset();
-
-PKFactory pkFactory = originSession.getPKFactory();
-OriginSelectByPartitionRangeStatement originSelectByPartitionRangeStatement = originSession
-.getOriginSelectByPartitionRangeStatement();
-ResultSet resultSet = originSelectByPartitionRangeStatement
-.execute(originSelectByPartitionRangeStatement.bind(min, max));
-TargetSelectByPKStatement targetSelectByPKStatement = targetSession.getTargetSelectByPKStatement();
-Integer fetchSizeInRows = originSession.getCqlTable().getFetchSizeInRows();
-
-List<Record> recordsToDiff = new ArrayList<>(fetchSizeInRows);
-StreamSupport.stream(resultSet.spliterator(), false).forEach(originRow -> {
-rateLimiterOrigin.acquire(1);
-Record record = new Record(pkFactory.getTargetPK(originRow), originRow, null);
-jobCounter.threadIncrement(JobCounter.CounterType.READ);
-
-if (originSelectByPartitionRangeStatement.shouldFilterRecord(record)) {
-jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
-} else {
-for (Record r : pkFactory.toValidRecordList(record)) {
-
-if (guardrailEnabled) {
-String guardrailCheck = guardrailFeature.guardrailChecks(r);
-if (guardrailCheck != null && guardrailCheck != Guardrail.CLEAN_CHECK) {
-logger.error("Guardrails failed for PrimaryKey {}; {}", r.getPk(), guardrailCheck);
-jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
-continue;
+try {
+jobCounter.threadReset();
+
+PKFactory pkFactory = originSession.getPKFactory();
+OriginSelectByPartitionRangeStatement originSelectByPartitionRangeStatement = originSession
+.getOriginSelectByPartitionRangeStatement();
+ResultSet resultSet = originSelectByPartitionRangeStatement
+.execute(originSelectByPartitionRangeStatement.bind(min, max));
+TargetSelectByPKStatement targetSelectByPKStatement = targetSession.getTargetSelectByPKStatement();
+Integer fetchSizeInRows = originSession.getCqlTable().getFetchSizeInRows();
+
+List<Record> recordsToDiff = new ArrayList<>(fetchSizeInRows);
+StreamSupport.stream(resultSet.spliterator(), false).forEach(originRow -> {
+rateLimiterOrigin.acquire(1);
+Record record = new Record(pkFactory.getTargetPK(originRow), originRow, null);
+jobCounter.threadIncrement(JobCounter.CounterType.READ);
+
+if (originSelectByPartitionRangeStatement.shouldFilterRecord(record)) {
+jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
+} else {
+for (Record r : pkFactory.toValidRecordList(record)) {
+
+if (guardrailEnabled) {
+String guardrailCheck = guardrailFeature.guardrailChecks(r);
+if (guardrailCheck != null && guardrailCheck != Guardrail.CLEAN_CHECK) {
+logger.error("Guardrails failed for PrimaryKey {}; {}", r.getPk(), guardrailCheck);
+jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
+continue;
+}
+}
+
+rateLimiterTarget.acquire(1);
+CompletionStage<AsyncResultSet> targetResult = targetSelectByPKStatement
+.getAsyncResult(r.getPk());
+
+if (null == targetResult) {
+jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
+} else {
+r.setAsyncTargetRow(targetResult);
+recordsToDiff.add(r);
+if (recordsToDiff.size() > fetchSizeInRows) {
+if (diffAndClear(recordsToDiff)) {
+hasDiff.set(true);
 }
 }
+} // targetRecord!=null
+} // recordSet iterator
+} // shouldFilterRecord
+});
+if (diffAndClear(recordsToDiff)) {
+hasDiff.set(true);
+}

-rateLimiterTarget.acquire(1);
-CompletionStage<AsyncResultSet> targetResult = targetSelectByPKStatement
-.getAsyncResult(r.getPk());
-
-if (null == targetResult) {
-jobCounter.threadIncrement(JobCounter.CounterType.SKIPPED);
-} else {
-r.setAsyncTargetRow(targetResult);
-recordsToDiff.add(r);
-if (recordsToDiff.size() > fetchSizeInRows) {
-if (diffAndClear(recordsToDiff)) {
-hasDiff.set(true);
-}
-}
-} // targetRecord!=null
-} // recordSet iterator
-} // shouldFilterRecord
-});
-if (diffAndClear(recordsToDiff)) {
-hasDiff.set(true);
-}
-done = true;
-
-if (hasDiff.get()) {
-if (trackRun)
-trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.DIFF);
-else if (appendPartitionOnDiff)
-logPartitionsInFile(partitionFileOutput, min, max);
-} else if (trackRun) {
-trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.PASS);
-}
-} catch (Exception e) {
-logger.error("Error with PartitionRange -- ThreadID: {} Processing min: {} max: {} -- Attempt# {}",
-Thread.currentThread().getId(), min, max, attempts, e);
-if (attempts == maxAttempts) {
-if (trackRun)
-trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.FAIL);
-else
-logPartitionsInFile(partitionFileOutput, min, max);
-}
-} finally {
-jobCounter.globalIncrement();
-printCounts(false);
+if (hasDiff.get()) {
+if (trackRun)
+trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.DIFF);
+else if (appendPartitionOnDiff)
+logPartitionsInFile(partitionFileOutput, min, max);
+} else if (trackRun) {
+trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.PASS);
 }
+} catch (Exception e) {
+logger.error("Error with PartitionRange -- ThreadID: {} Processing min: {} max: {}",
+Thread.currentThread().getId(), min, max, e);
+if (trackRun)
+trackRunFeature.updateCdmRun(min, TrackRun.RUN_STATUS.FAIL);
+else
+logPartitionsInFile(partitionFileOutput, min, max);
+} finally {
+jobCounter.globalIncrement();
+printCounts(false);
 }
 }
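
After this commit, getDataAndDiff follows the same single-attempt structure as the copy job. Independent of the retry removal, the loop batches target lookups and compares them via diffAndClear once the list grows past fetchSizeInRows, with one final flush after the stream completes. A stand-alone sketch of that flush-when-full pattern, using illustrative names rather than the CDM API:

import java.util.ArrayList;
import java.util.List;

public class BatchFlushSketch {

    // Stand-in for diffAndClear: "compares" the batch, empties it, and reports whether a diff was found.
    static boolean diffAndClear(List<String> batch) {
        System.out.println("diffing " + batch.size() + " records");
        batch.clear();
        return false; // pretend no differences were found
    }

    public static void main(String[] args) {
        int fetchSizeInRows = 3;
        List<String> recordsToDiff = new ArrayList<>(fetchSizeInRows);

        for (int i = 0; i < 10; i++) {
            recordsToDiff.add("record-" + i);
            if (recordsToDiff.size() > fetchSizeInRows) {
                diffAndClear(recordsToDiff);   // flush once the batch exceeds the threshold
            }
        }
        diffAndClear(recordsToDiff);           // final flush for whatever remains
    }
}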

src/main/java/com/datastax/cdm/properties/KnownProperties.java

Lines changed: 0 additions & 3 deletions
@@ -119,7 +119,6 @@ public enum PropertyType {
 public static final String READ_CL = "spark.cdm.perfops.consistency.read";
 public static final String WRITE_CL = "spark.cdm.perfops.consistency.write";
 public static final String PERF_FETCH_SIZE = "spark.cdm.perfops.fetchSizeInRows";
-public static final String MAX_RETRIES = "spark.cdm.perfops.errorLimit";
 public static final String PRINT_STATS_AFTER = "spark.cdm.perfops.printStatsAfter";
 public static final String PRINT_STATS_PER_PART = "spark.cdm.perfops.printStatsPerPart";

@@ -154,8 +153,6 @@ public enum PropertyType {
 defaults.put(PRINT_STATS_PER_PART, "false");
 types.put(PERF_FETCH_SIZE, PropertyType.NUMBER);
 defaults.put(PERF_FETCH_SIZE, "1000");
-types.put(MAX_RETRIES, PropertyType.NUMBER);
-defaults.put(MAX_RETRIES, "0");
 }

 // ==========================================================================
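
Both hunks remove the spark.cdm.perfops.errorLimit key along with its type and default registration. A stand-alone sketch, with hypothetical names rather than the CDM implementation, of the registry pattern these paired types.put / defaults.put calls follow:

import java.util.HashMap;
import java.util.Map;

public class PropertyRegistrySketch {

    enum PropertyType { STRING, NUMBER, BOOLEAN }

    static final Map<String, PropertyType> types = new HashMap<>();
    static final Map<String, String> defaults = new HashMap<>();

    // Mirrors the paired types.put(...) / defaults.put(...) calls in the hunk above.
    static void register(String key, PropertyType type, String defaultValue) {
        types.put(key, type);
        defaults.put(key, defaultValue);
    }

    public static void main(String[] args) {
        register("spark.cdm.perfops.fetchSizeInRows", PropertyType.NUMBER, "1000");
        register("spark.cdm.perfops.printStatsPerPart", PropertyType.BOOLEAN, "false");

        String key = "spark.cdm.perfops.fetchSizeInRows";
        System.out.println(key + " -> " + types.get(key) + ", default " + defaults.get(key));
    }
}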

src/resources/cdm-detailed.properties

Lines changed: 3 additions & 7 deletions
@@ -193,7 +193,7 @@ spark.cdm.trackRun.previousRunId 0
 #spark.cdm.tokenrange.partitionFile.appendOnDiff false

 #===========================================================================================================
-# Performance and Operations Parameters affecting throughput, error handling, and similar concerns.
+# Performance and Operations Parameters affecting throughput and similar concerns.
 #
 # Recommended Parameters:
 # spark.cdm.perfops
@@ -228,11 +228,8 @@ spark.cdm.trackRun.previousRunId 0
 # entry will be made.
 # .printStatsPerPart : Default is false. Print statistics for each part after it is processed.
 # .fetchSizeInRows : Default is 1000. This affects the frequency of reads from Origin, and also the
-# frequency of flushes to Target.
-# .errorLimit : Default is 0. Controls how many errors a thread may encounter during Migrate
-# and DiffData operations before failing. It is recommended to set this to a non-
-# zero value only when not doing a mutation-type operation, e.g. when running
-# DiffData without .autocorrect.
+# frequency of flushes to Target. A larger value will reduce the number of reads
+# and writes, but will increase the memory requirements.
 #-----------------------------------------------------------------------------------------------------------
 spark.cdm.perfops.numParts 5000
 spark.cdm.perfops.batchSize 5
@@ -429,4 +426,3 @@ spark.cdm.perfops.ratelimit.target 20000
 #spark.cdm.connect.target.tls.keyStore.path
 #spark.cdm.connect.target.tls.keyStore.password
 #spark.cdm.connect.target.tls.enabledAlgorithms TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA
-
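
With the errorLimit description gone, the fetchSizeInRows note above is the remaining knob documented here for trading read/flush frequency against memory. As an illustration only (the value is arbitrary, not a recommendation), overriding it would be a single line in this properties file, in the same key/value format the file already uses:

spark.cdm.perfops.fetchSizeInRows 5000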
