Skip to content

Commit 2cf0e85

Browse files
committed
Employ a single merged jSRE model (covering both element and mineral relations) instead of separate per-type models, and output target_ids in extracted relations.
1 parent 77f383e commit 2cf0e85

File tree

1 file changed

+10
-3
lines changed

1 file changed

+10
-3
lines changed

src/parserindexer/parse_all.py

Lines changed: 10 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -101,7 +101,11 @@ def parse_file(self, path):
101101
out.close()
102102

103103
# Call jSRE extraction (prediction)
104-
self.jsre_parser.predict(self.jsre_model + jsre_fn[4:] + '.model',
104+
# This version works if you want to call separate
105+
# element and mineral models.
106+
#self.jsre_parser.predict(self.jsre_model + jsre_fn[4:] + '.model',
107+
# This version works if you want one merged model.
108+
self.jsre_parser.predict(self.jsre_model,
105109
jsre_fn, jsre_fn + '_out')
106110

107111
rel = []
@@ -122,11 +126,14 @@ def parse_file(self, path):
122126
# To store in Solr:
123127
cont = {
124128
'label': 'contains', # also stored as 'type'
125-
# target_names_ss (list), cont_names_ss (list)
129+
# target_names (list), cont_names (list)
126130
'target_names': [canonical_target_name(ex[0]['word'])],
127131
'cont_names': [canonical_name(ex[1]['word'])],
128-
# cont_ids_ss (list)
132+
# target_ids (list), cont_ids (list)
129133
# - p_id prepended in indexer.py
134+
'target_ids': ['%s_%d_%d' % (ex[0]['ner'].lower(),
135+
ex[0]['characterOffsetBegin'],
136+
ex[0]['characterOffsetEnd'])],
130137
'cont_ids': ['%s_%d_%d' % (ex[1]['ner'].lower(),
131138
ex[1]['characterOffsetBegin'],
132139
ex[1]['characterOffsetEnd'])],

0 commit comments

Comments
 (0)