Skip to content

Commit 82bb655

Browse files
committed
Merge branch 'master' into readme-update
2 parents 7bb167b + 3a1c8fd commit 82bb655

File tree

4 files changed

+22
-26
lines changed

4 files changed

+22
-26
lines changed

bin/roosterize

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,5 +4,5 @@ _DIR=$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )
44

55

66
( cd $_DIR/../
7-
python -m roosterize.main $@
7+
python -m roosterize.main "$@"
88
)

dist-bin/roosterize

Lines changed: 1 addition & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -4,5 +4,5 @@ _DIR=$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )
44

55

66
( cd $_DIR/../
7-
./roosterize $@
7+
./roosterize "$@"
88
)

pretrain.sh

Lines changed: 17 additions & 23 deletions
Original file line number | Diff line number | Diff line change
@@ -9,27 +9,23 @@ _DIR=$( cd "$( dirname "${BASH_SOURCE[0]}" )" && pwd )
99
function process_data() {
1010
local ds=$1; shift
1111

12-
( cd $_DIR/python/
13-
rm -rf $_DIR/output/$ds/data
14-
python -m roosterize.main extract_data_from_corpus\
15-
--corpus=$_DIR/../math-comp-corpus\
16-
--output=$_DIR/output/$ds/data\
17-
--groups=$ds
18-
)
12+
rm -rf $_DIR/output/$ds/data
13+
python -m roosterize.main extract_data_from_corpus\
14+
--corpus=$_DIR/../math-comp-corpus\
15+
--output=$_DIR/output/$ds/data\
16+
--groups=$ds
1917
}
2018

2119
function train_model() {
2220
local ds=$1; shift
2321

24-
( cd $_DIR/python/
25-
rm -rf $_DIR/output/$ds/model
26-
python -m roosterize.main train_model\
27-
--train=$_DIR/output/$ds/data/$ds-train\
28-
--val=$_DIR/output/$ds/data/$ds-val\
29-
--model-dir=$_DIR/output/$ds/model\
30-
--output=$_DIR/output/$ds/data\
31-
--config-file=$_DIR/configs/Stmt+ChopKnlTree+attn+copy.json
32-
)
22+
rm -rf $_DIR/output/$ds/model
23+
python -m roosterize.main train_model\
24+
--train=$_DIR/output/$ds/data/$ds-train\
25+
--val=$_DIR/output/$ds/data/$ds-val\
26+
--model-dir=$_DIR/output/$ds/model\
27+
--output=$_DIR/output/$ds/data\
28+
--config-file=$_DIR/configs/Stmt+ChopKnlTree+attn+copy.json
3329
}
3430

3531
function package_model() {
@@ -43,13 +39,11 @@ function package_model() {
4339
function eval_model() {
4440
local ds=$1; shift
4541

46-
( cd $_DIR/python/
47-
rm -rf $_DIR/output/$ds/results
48-
python -m roosterize.main eval_model\
49-
--data=$_DIR/output/$ds/data/$ds-test\
50-
--model-dir=$_DIR/output/$ds/model\
51-
--output=$_DIR/output/$ds/results
52-
)
42+
rm -rf $_DIR/output/$ds/results
43+
python -m roosterize.main eval_model\
44+
--data=$_DIR/output/$ds/data/$ds-test\
45+
--model-dir=$_DIR/output/$ds/model\
46+
--output=$_DIR/output/$ds/results
5347
}
5448

5549
function retrain_all_models() {

roosterize/ml/naming/MultiSourceSeq2Seq.py

Lines changed: 3 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -349,7 +349,9 @@ def process_data_impl(
349349
# Inputs
350350
all_inputs: Dict[str, List[List[str]]] = self.get_all_inputs(lemmas, docs_sub_tokenizers)
351351
for input_type, src_sentences in all_inputs.items():
352-
IOUtils.dump(output_processed_data_dir/f"src.{input_type}.txt", src_sentences, IOUtils.Format.txtList)
352+
IOUtils.dump(output_processed_data_dir/f"src.{input_type}.txt",
353+
"".join([" ".join(sent) + "\n" for sent in src_sentences]),
354+
IOUtils.Format.txt)
353355

354356
# Outputs
355357
IOUtils.dump(

0 commit comments

Comments
 (0)