@@ -217,7 +217,9 @@ def docs_data_process(path):
217
217
# schema process
218
218
print ("\n =================DUEE FINANCE DATASET==============" )
219
219
conf_dir = "./conf/DuEE-Fin"
220
- schema_path = "{}/event_schema.json" .format (conf_dir )
220
+ if not os .path .exists (conf_dir ):
221
+ os .makedirs (conf_dir )
222
+ schema_path = "./data/DuEE-fin/duee_fin_event_schema.json"
221
223
tags_trigger_path = "{}/trigger_tag.dict" .format (conf_dir )
222
224
tags_role_path = "{}/role_tag.dict" .format (conf_dir )
223
225
tags_enum_path = "{}/enum_tag.dict" .format (conf_dir )
@@ -245,11 +247,14 @@ def docs_data_process(path):
245
247
print ("\n ********** start document process **********" )
246
248
if not os .path .exists (sentence_dir ):
247
249
os .makedirs (sentence_dir )
248
- train_sent = docs_data_process ("{}/duee_fin_train.json" .format (data_dir ))
250
+ train_sent = docs_data_process (
251
+ "./data/DuEE-fin/duee_fin_train.json/duee_fin_train.json" )
249
252
write_by_lines ("{}/train.json" .format (sentence_dir ), train_sent )
250
- dev_sent = docs_data_process ("{}/duee_fin_dev.json" .format (data_dir ))
253
+ dev_sent = docs_data_process (
254
+ "./data/DuEE-fin/duee_fin_dev.json/duee_fin_dev.json" )
251
255
write_by_lines ("{}/dev.json" .format (sentence_dir ), dev_sent )
252
- test_sent = docs_data_process ("{}/duee_fin_test1.json" .format (data_dir ))
256
+ test_sent = docs_data_process (
257
+ "./data/DuEE-fin/duee_fin_test2.json/duee_fin_test2.json" )
253
258
write_by_lines ("{}/test.json" .format (sentence_dir ), test_sent )
254
259
print ("train {} dev {} test {}" .format (
255
260
len (train_sent ), len (dev_sent ), len (test_sent )))
0 commit comments