@@ -27,7 +27,8 @@ object LdbcDatagen extends SparkApp {
27
27
numThreads : Option [Int ] = None ,
28
28
format : String = " csv" ,
29
29
generateFactors : Boolean = false ,
30
- formatOptions : Map [String , String ] = Map .empty
30
+ formatOptions : Map [String , String ] = Map .empty,
31
+ oversizeFactor : Option [Double ] = None
31
32
)
32
33
33
34
def main (args : Array [String ]): Unit = {
@@ -65,6 +66,12 @@ object LdbcDatagen extends SparkApp {
65
66
.action((x, c) => args.mode.set(c)(x))
66
67
.text(" Generation mode. Options: raw, bi, interactive. Default: raw" )
67
68
69
+ opt[Double ](" oversize-factor" )
70
+ .action((x, c) => args.oversizeFactor.set(c)(Some (x)))
71
+ .text(" Controls size of files relative to Persons. " +
72
+ " Values larger than 1 will result in less but larger files. " +
73
+ " Smaller values result in more, smaller files" )
74
+
68
75
opt[Double ](" bulkload-portion" )
69
76
.action((x, c) => args.bulkloadPortion.set(c)(x))
70
77
.text(" Bulkload portion. Only applicable to BI and interactive modes" )
@@ -113,14 +120,15 @@ object LdbcDatagen extends SparkApp {
113
120
params = args.params,
114
121
paramFile = args.paramFile,
115
122
outputDir = args.outputDir,
116
- numThreads = args.numThreads
123
+ numThreads = args.numThreads,
124
+ oversizeFactor = args.oversizeFactor
117
125
)
118
126
119
127
val generatorConfig = GenerationStage .buildConfig(generatorArgs)
120
128
121
129
DatagenContext .initialize(generatorConfig)
122
130
123
- GenerationStage .run(generatorConfig)
131
+ GenerationStage .run(generatorArgs, generatorConfig)
124
132
125
133
if (args.generateFactors) {
126
134
val factorArgs = FactorGenerationStage .Args ()
0 commit comments