@@ -22,110 +22,77 @@ workflows:
22
22
executors :
23
23
my-executor :
24
24
machine :
25
- image : ubuntu-2004:202008-01
25
+ image : ubuntu-2204:2022.04.1
26
+ docker_layer_caching : true
26
27
working_directory : ~/ldbc/ldbc_snb_datagen
27
28
28
29
jobs :
29
30
test :
30
31
executor : my-executor
31
32
environment :
32
- PLATFORM_VERSION : 2.12_spark3.1
33
+ PLATFORM_VERSION : 2.12_spark3.2
33
34
DATAGEN_VERSION : 0.5.0-SNAPSHOT
34
35
steps :
35
36
- checkout
36
- - run :
37
- name : Install dependencies
38
- command : |
39
- mkdir out/
40
- DEBIAN_FRONTEND=noninteractive
41
- sudo apt update
42
- sudo apt install -y openjdk-8-jdk zip
43
- sudo update-alternatives --install /usr/bin/java java /usr/lib/jvm/java-8-openjdk-amd64/bin/java 1
44
- sudo update-alternatives --set java /usr/lib/jvm/java-8-openjdk-amd64/bin/java
45
37
- run :
46
38
name : Build Docker container
47
39
command : |
48
- docker build . -t ldbc/spark
49
- - restore_cache :
50
- keys :
51
- - m2-dep-branch:{{ .Branch }}-pom:{{ checksum "pom.xml" }}-
52
- - m2-dep-branch:dev-pom:{{ checksum "pom.xml" }}-
53
- - m2-dep-branch:{{ .Branch }}-
54
- - m2-dep-branch:dev-
55
- - run :
56
- name : Build JAR file
57
- command : |
58
- mvn -ntp clean test-compile assembly:assembly
59
- - save_cache :
60
- key : m2-dep-branch:{{ .Branch }}-pom:{{ checksum "pom.xml" }}-{{ epoch }}
61
- paths :
62
- - ~/.m2/repository # maven deps
40
+ docker build . --target=standalone --tag ldbc/datagen-standalone:latest
63
41
# BI
64
- - run :
42
+ - run :
65
43
name : Generate SF0.003 / BI / singular-projected CSVs
66
44
command : |
67
- tools/docker-run.sh --mode bi --scale-factor 0.003 --explode-edges --explode-attrs
45
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --explode-edges --explode-attrs
68
46
mv out/ social-network-sf0.003-bi-singular-projected-fk/
69
47
- run :
70
48
name : Generate SF0.003 / BI / singular-merged CSVs
71
49
command : |
72
- tools/docker-run.sh --mode bi --scale-factor 0.003 --explode-attrs
50
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --explode-attrs
73
51
mv out/ social-network-sf0.003-bi-singular-merged-fk/
74
52
- run :
75
53
name : Generate SF0.003 / BI / composite-projected CSVs
76
54
command : |
77
- tools/docker-run.sh --mode bi --scale-factor 0.003 --explode-edges
55
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --explode-edges
78
56
mv out/ social-network-sf0.003-bi-composite-projected-fk/
79
57
- run :
80
- name : Generate SF0.003 / BI / composite-merged CSVs
58
+ name : Generate SF0.003 / BI / composite-merged CSVs, generate factors
81
59
command : |
82
60
# we generate factors here but they are moved to a separate archive (social-network-sf0.003-bi-factors.zip)
83
- tools/docker-run.sh --mode bi --scale-factor 0.003 --generate-factors
61
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --generate-factors
84
62
mv out/ social-network-sf0.003-bi-composite-merged-fk/
85
63
- run :
86
64
name : Generate SF0.003 / BI / compressed composite-merged CSVs for Postgres
87
65
command : |
88
- tools/docker-run.sh --mode bi --scale-factor 0.003 --format-options compression=gzip
66
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --format-options compression=gzip
89
67
mv out/ social-network-sf0.003-bi-composite-merged-fk-postgres-compressed/
90
68
- run :
91
69
name : Generate SF0.003 / BI / composite-projected CSVs for Neo4j
92
70
command : |
93
- tools/docker-run.sh --mode bi --scale-factor 0.003 --explode-edges --format-options header=false,quoteAll=true
71
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --explode-edges --format-options header=false,quoteAll=true
94
72
mv out/ social-network-sf0.003-bi-composite-projected-fk-neo4j/
95
73
- run :
96
74
name : Generate SF0.003 / BI / compressed composite-projected CSVs for Neo4j
97
75
command : |
98
- tools/docker-run.sh --mode bi --scale-factor 0.003 --explode-edges --format-options header=false,quoteAll=true,compression=gzip
76
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --explode-edges --format-options header=false,quoteAll=true,compression=gzip
99
77
mv out/ social-network-sf0.003-bi-composite-projected-fk-neo4j-compressed/
100
- # Interactive
101
- - run :
102
- name : Generate SF0.003 / Interactive / singular-projected CSVs
103
- command : |
104
- tools/docker-run.sh --mode interactive --scale-factor 0.003 --explode-edges --explode-attrs
105
- mv out/ social-network-sf0.003-interactive-singular-projected-fk/
106
- - run :
107
- name : Generate SF0.003 / Interactive / singular-merged CSVs
108
- command : |
109
- tools/docker-run.sh --mode interactive --scale-factor 0.003 --explode-attrs
110
- mv out/ social-network-sf0.003-interactive-singular-merged-fk/
111
78
- run :
112
- name : Generate SF0.003 / Interactive / composite-projected CSVs
79
+ name : Generate SF0.003 / BI / compressed composite-projected CSVs for Neo4j with epoch milli timestamps
113
80
command : |
114
- tools/docker-run.sh --mode interactive --scale-factor 0.003 --explode-edges
115
- mv out/ social-network-sf0.003-interactive-composite-projected-fk/
81
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --explode-edges --epoch-millis --format-options header=false,quoteAll=true,compression=gzip
82
+ mv out/ social-network-sf0.003-bi-composite-projected-fk-neo4j-compressed-epoch-millis/
116
83
- run :
117
- name : Generate SF0.003 / Interactive / composite-merged CSVs
84
+ name : Generate SF0.003 / BI / composite-merged Parquet files
118
85
command : |
119
- tools/docker-run.sh --mode interactive --scale-factor 0.003
120
- mv out/ social-network-sf0.003-interactive-composite-merged-fk/
86
+ tools/docker-run.sh -- --mode bi --scale-factor 0.003 --format parquet
87
+ mv out/ social-network-sf0.003-bi-parquet
121
88
- run :
122
89
name : Compress directories and prepare for deployment
123
90
command : |
124
91
# include the CircleCI configuration in the deployed package to provide the 'filters' instructions (and prevent failed builds on the gh-pages branch)
125
92
mv .circleci dist/
126
93
# copy factors to a separate directory (the originals stay in the composite-merged-fk directory)
127
94
mkdir social-network-sf0.003-bi-factors
128
- mv social-network-sf0.003-bi-composite-merged-fk/factors social-network-sf0.003-bi-factors/factors
95
+ cp -r social-network-sf0.003-bi-composite-merged-fk/factors social-network-sf0.003-bi-factors/factors
129
96
# compress each directory
130
97
for d in social-network-sf0.003*; do
131
98
echo "Generated with <https://github.com/ldbc/ldbc_snb_datagen_spark/commit/${CIRCLE_SHA1}>" > $d/README.md
0 commit comments