Skip to content

Commit 9f38c0a

Browse files
Merge branch 'main' into feature/exception_handler_refactor
# Conflicts: # src/main/java/com/datastax/cdm/job/AbstractJobSession.java # src/resources/cdm.properties
2 parents 35906b8 + 6ac18cc commit 9f38c0a

File tree

40 files changed

+581
-454
lines changed

40 files changed

+581
-454
lines changed

PERF/cdm-v4.properties

Lines changed: 28 additions & 28 deletions
Original file line numberDiff line numberDiff line change
@@ -20,8 +20,8 @@
2020
# Connections are made with the Spark Cassandra Connector; conventions there likely work here
2121
# See https://github.com/datastax/spark-cassandra-connector/blob/master/doc/reference.md
2222
#
23-
# spark.cdm.origin.connect
24-
# spark.cdm.target.connect
23+
# spark.cdm.connect.origin
24+
# spark.cdm.connect.target
2525
# .host : Default is localhost. Hostname/IP address of the cluster; may be a comma-separated list,
2626
# and can follow the <hostname>:<port> convention.
2727
# .port : Default is 9042. Port number to use if not specified on .host
@@ -31,17 +31,17 @@
3131
#
3232
# You must set either .host or .scb.
3333
#-----------------------------------------------------------------------------------------------------------
34-
spark.cdm.origin.connect.host cass-origin
35-
spark.cdm.origin.connect.port 9042
36-
#spark.cdm.origin.connect.scb file:///aaa/bbb/secure-connect-enterprise.zip
37-
spark.cdm.origin.connect.username cassandra
38-
spark.cdm.origin.connect.password cassandra
34+
spark.cdm.connect.origin.host cass-origin
35+
spark.cdm.connect.origin.port 9042
36+
#spark.cdm.connect.origin.scb file:///aaa/bbb/secure-connect-enterprise.zip
37+
spark.cdm.connect.origin.username cassandra
38+
spark.cdm.connect.origin.password cassandra
3939

40-
spark.cdm.target.connect.host cass-target
41-
spark.cdm.target.connect.port 9042
42-
#spark.cdm.target.connect.scb file:///aaa/bbb/secure-connect-enterprise.zip
43-
spark.cdm.target.connect.username cassandra
44-
spark.cdm.target.connect.password cassandra
40+
spark.cdm.connect.target.host cass-target
41+
spark.cdm.connect.target.port 9042
42+
#spark.cdm.connect.target.scb file:///aaa/bbb/secure-connect-enterprise.zip
43+
spark.cdm.connect.target.username cassandra
44+
spark.cdm.connect.target.password cassandra
4545

4646
#===========================================================================================================
4747
# Details about the Origin Schema
@@ -326,8 +326,8 @@ spark.cdm.perfops.writeRateLimit 5000
326326
# TLS (SSL) connection parameters, if so configured. Note that Secure Bundles embed these details.
327327
# See https://github.com/datastax/spark-cassandra-connector/blob/master/doc/reference.md
328328
#
329-
# spark.cdm.origin.connect.tls
330-
# spark.cdm.target.connect.tls
329+
# spark.cdm.connect.origin.tls
330+
# spark.cdm.connect.target.tls
331331
# .enabled : Default is false. Set to true if TLS is used.
332332
# .trustStore
333333
# .path : Filepath to the Java truststore file
@@ -338,20 +338,20 @@ spark.cdm.perfops.writeRateLimit 5000
338338
# .password : Password needed to open the keystore
339339
# .enabledAlgorithms : Default is TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA
340340
#-----------------------------------------------------------------------------------------------------------
341-
#spark.cdm.origin.connect.tls.enabled false
342-
#spark.cdm.origin.connect.tls.trustStore.path
343-
#spark.cdm.origin.connect.tls.trustStore.password
344-
#spark.cdm.origin.connect.tls.trustStore.type JKS
345-
#spark.cdm.origin.connect.tls.keyStore.path
346-
#spark.cdm.origin.connect.tls.keyStore.password
347-
#spark.cdm.origin.connect.tls.enabledAlgorithms TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA
341+
#spark.cdm.connect.origin.tls.enabled false
342+
#spark.cdm.connect.origin.tls.trustStore.path
343+
#spark.cdm.connect.origin.tls.trustStore.password
344+
#spark.cdm.connect.origin.tls.trustStore.type JKS
345+
#spark.cdm.connect.origin.tls.keyStore.path
346+
#spark.cdm.connect.origin.tls.keyStore.password
347+
#spark.cdm.connect.origin.tls.enabledAlgorithms TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA
348348

349-
#spark.cdm.target.connect.tls.enabled false
350-
#spark.cdm.target.connect.tls.trustStore.path
351-
#spark.cdm.target.connect.tls.trustStore.password
352-
#spark.cdm.target.connect.tls.trustStore.type JKS
353-
#spark.cdm.target.connect.tls.keyStore.path
354-
#spark.cdm.target.connect.tls.keyStore.password
355-
#spark.cdm.target.connect.tls.enabledAlgorithms TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA
349+
#spark.cdm.connect.target.tls.enabled false
350+
#spark.cdm.connect.target.tls.trustStore.path
351+
#spark.cdm.connect.target.tls.trustStore.password
352+
#spark.cdm.connect.target.tls.trustStore.type JKS
353+
#spark.cdm.connect.target.tls.keyStore.path
354+
#spark.cdm.connect.target.tls.keyStore.password
355+
#spark.cdm.connect.target.tls.enabledAlgorithms TLS_RSA_WITH_AES_128_CBC_SHA,TLS_RSA_WITH_AES_256_CBC_SHA
356356

357357

README.md

Lines changed: 5 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -26,8 +26,9 @@ tar -xvzf spark-3.3.1-bin-hadoop3.tgz
2626

2727
> :warning: Note that Version 4 of the tool is not backward-compatible with .properties files created in previous versions, and that package names have changed.
2828
29-
1. `cdm.properties` file needs to be configured as applicable for the environment. Parameter descriptions and defaults are described in the file.
30-
> A sample properties file configuration can be [found here](./src/resources/cdm.properties)
29+
1. The `cdm.properties` file needs to be configured as applicable for the environment. Parameter descriptions and defaults are described in the file. The file can have any name; it does not need to be `cdm.properties`.
30+
> * A simplified sample properties file configuration can be found here as [cdm.properties](./src/resources/cdm.properties)
31+
> * A complete sample properties file configuration can be found here as [cdm-detailed.properties](./src/resources/cdm-detailed.properties)
3132
2. Place the properties file where it can be accessed while running the job via spark-submit.
3233
3. Run the job using the `spark-submit` command as shown below:
3334

@@ -119,12 +120,12 @@ When running in above mode the tool assumes a `partitions.csv` file to be presen
119120
# Perform large-field Guardrail violation checks
120121
- The tool can be used to identify large fields from a table that may break your cluster guardrails (e.g. AstraDB has a 10MB limit for a single large field) using `--class datastax.cdm.job.GuardrailCheck` as shown below
121122
```
122-
./spark-submit --properties-file cdmGuardrail.properties /
123+
./spark-submit --properties-file cdm.properties /
123124
--conf spark.cdm.schema.origin.keyspaceTable="<keyspace-name>.<table-name>" /
125+
--conf spark.cdm.feature.guardrail.colSizeInKB=10000 /
124126
--master "local[*]" /
125127
--class datastax.cdm.job.GuardrailCheck cassandra-data-migrator-4.x.x.jar &> logfile_name_$(date +%Y%m%d_%H_%M).txt
126128
```
127-
> A sample Guardrail properties file can be [found here](./src/resources/cdmGuardrail.properties)
128129

129130
# Features
130131
- Auto-detects table schema (column names, types, keys, collections, UDTs, etc.)

SIT/features/01_constant_column/fix.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.feature_constant_column
55
spark.cdm.schema.target.keyspaceTable target.feature_constant_column

SIT/features/01_constant_column/migrate.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.feature_constant_column
55
spark.cdm.schema.target.keyspaceTable target.feature_constant_column

SIT/features/02_explode_map/fix.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.feature_explode_map
55
spark.cdm.schema.target.keyspaceTable target.feature_explode_map

SIT/features/02_explode_map/migrate.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.feature_explode_map
55
spark.cdm.schema.target.keyspaceTable target.feature_explode_map

SIT/features/03_codec/fix.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.codec
55
spark.cdm.schema.target.keyspaceTable target.codec

SIT/features/03_codec/migrate.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.codec
55
spark.cdm.schema.target.keyspaceTable target.codec

SIT/features/04_udt_mapper/fix.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.udt_mapper
55
spark.cdm.schema.target.keyspaceTable target.udt_mapper

SIT/features/04_udt_mapper/migrate.properties

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,5 +1,5 @@
1-
spark.cdm.origin.connect.host cdm-sit-cass
2-
spark.cdm.target.connect.host cdm-sit-cass
1+
spark.cdm.connect.origin.host cdm-sit-cass
2+
spark.cdm.connect.target.host cdm-sit-cass
33

44
spark.cdm.schema.origin.keyspaceTable origin.udt_mapper
55
spark.cdm.schema.target.keyspaceTable target.udt_mapper

0 commit comments

Comments
 (0)