#!/bin/bash
# -------------------------------------------------------------
#
# Licensed to the Apache Software Foundation (ASF) under one
# or more contributor license agreements. See the NOTICE file
# distributed with this work for additional information
# regarding copyright ownership. The ASF licenses this file
# to you under the Apache License, Version 2.0 (the
# "License"); you may not use this file except in compliance
# with the License. You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing,
# software distributed under the License is distributed on an
# "AS IS" BASIS, WITHOUT WARRANTIES OR CONDITIONS OF ANY
# KIND, either express or implied. See the License for the
# specific language governing permissions and limitations
# under the License.
#
# -------------------------------------------------------------

# Generates the binomial data sets (dense and sparse variants) and the
# matching test splits for the perftest scenarios.
#
# Usage: <this script> CMD BASE MAXMEM
#   CMD     launcher used to run a DML script; invoked as
#           "CMD -f <script.dml> --args ..."
#   BASE    parent directory of the generated data; everything is written
#           below BASE/binomial
#   MAXMEM  integer; a scenario is generated when MAXMEM is >= its threshold
#           (80, 800, 8000, 80000, 800000 -- labelled 80MB ... 800GB in the
#           scenario comments below, so MAXMEM is presumably given in MB)
#
# Must be started from a directory named 'perftest'; a progress marker is
# appended to results/times.txt relative to that directory.

if [ "$(basename "$PWD")" != "perftest" ]; then
  echo "Please execute scripts from directory 'perftest'" >&2
  exit 1
fi

if [ "$#" -lt 3 ]; then
  echo "Usage: ${0##*/} CMD BASE MAXMEM" >&2
  exit 1
fi

# Reject a non-numeric MAXMEM up front instead of letting every threshold
# test below fail with "integer expression expected".
case "$3" in
  '' | - | *[!0-9-]* | ?*-*)
    echo "MAXMEM must be an integer, got '$3'" >&2
    exit 1
    ;;
esac

CMD=$1
BASE=$2/binomial
MAXMEM=$3

FORMAT="binary" # can be csv, mm, text, binary
DENSE_SP=0.9
SPARSE_SP=0.01

# Runs the logistic-regression data generator for one data set.
# Arguments: $1 - number of rows
#            $2 - data set name suffix (e.g. 10k_1k_dense); outputs are
#                 BASE/w<suffix>, BASE/X<suffix> and BASE/y<suffix>
#            $3 - sparsity value handed to the generator
# The remaining positional arguments (1000 5 5 ... 1 0 ... 1) are passed
# through exactly as before; see the DML script for their meaning.
gen_data() {
  local rows=$1 name=$2 sparsity=$3
  # CMD is intentionally unquoted so a launcher made of several words
  # (command plus fixed options) keeps working.
  # shellcheck disable=SC2086
  ${CMD} -f datagen/genRandData4LogisticRegression.dml --args \
    "$rows" 1000 5 5 \
    "${BASE}/w${name}" "${BASE}/X${name}" "${BASE}/y${name}" \
    1 0 "$sparsity" "$FORMAT" 1
}

# Runs the test-data extraction for one previously generated data set.
# Arguments: $1 - data set name suffix; reads BASE/X<suffix> and
#                 BASE/y<suffix>, writes the corresponding *_test outputs
extract_test_data() {
  local name=$1
  # shellcheck disable=SC2086
  ${CMD} -f scripts/extractTestData.dml --args \
    "${BASE}/X${name}" "${BASE}/y${name}" \
    "${BASE}/X${name}_test" "${BASE}/y${name}_test" "$FORMAT"
}

# Generates the dense and sparse variants of one scenario concurrently.
# Both generators run in the background; each extraction is started (also
# in the background) once its generator has finished. The function returns
# as soon as both generators are done -- the extractions may still be
# running and are collected by the final 'wait' of the script.
# Arguments: $1 - number of rows, $2 - scenario tag (e.g. 10k_1k)
generate_concurrently() {
  local rows=$1 tag=$2
  local pid_dense pid_sparse

  gen_data "$rows" "${tag}_dense" "$DENSE_SP" &
  pid_dense=$!
  gen_data "$rows" "${tag}_sparse" "$SPARSE_SP" &
  pid_sparse=$!

  wait "$pid_dense"
  extract_test_data "${tag}_dense" &
  wait "$pid_sparse"
  extract_test_data "${tag}_sparse" &
}

# Generates the dense and sparse variants of one scenario strictly one
# step after the other (used for the largest scenarios).
# Arguments: $1 - number of rows, $2 - scenario tag (e.g. 10M_1k)
generate_sequentially() {
  local rows=$1 tag=$2

  gen_data "$rows" "${tag}_dense" "$DENSE_SP"
  gen_data "$rows" "${tag}_sparse" "$SPARSE_SP"
  extract_test_data "${tag}_dense"
  extract_test_data "${tag}_sparse"
}

printf '\n\n-- Generating binomial data...\n' >> results/times.txt

# NOTE: '[' (not '[[') is used for the comparisons so MAXMEM is always read
# as a decimal number, even with leading zeros.

# generate XS scenarios (80MB)
if [ "$MAXMEM" -ge 80 ]; then
  generate_concurrently 10000 10k_1k
fi

# generate S scenarios (800MB)
if [ "$MAXMEM" -ge 800 ]; then
  generate_concurrently 100000 100k_1k
fi

# generate M scenarios (8GB)
if [ "$MAXMEM" -ge 8000 ]; then
  generate_concurrently 1000000 1M_1k
fi

# generate L scenarios (80GB)
if [ "$MAXMEM" -ge 80000 ]; then
  generate_sequentially 10000000 10M_1k
fi

# generate XL scenarios (800GB)
if [ "$MAXMEM" -ge 800000 ]; then
  generate_sequentially 100000000 100M_1k
fi

# Collect any extraction jobs still running in the background.
wait