Skip to content

Commit f8f7ef1

Browse files
author
NilsFo
committed
Merge branch 'master' into zipped_h5
# Conflicts:
#	predict_batch.py
2 parents bd6e8fc + a005619 commit f8f7ef1

File tree

2 files changed: +144 additions, -125 deletions (lines changed)

2 files changed

+144
-125
lines changed

predict_batch.py

Lines changed: 82 additions & 51 deletions
Original file line number | Diff line number | Diff line change
@@ -22,8 +22,8 @@
2222

2323
# MODELS IN USE
2424
# Default trained for N1 normalisation
25-
model_source_path_oligo = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/models/results/oligo_final_sigmodal/0_custom/'
26-
model_source_path_neuron = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/models/results/neuron_final_sigmodal/0_custom/'
25+
model_source_path_oligo = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/models/results/oligo_final_sigmodal/0_custom/'
26+
model_source_path_neuron = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/models/results/neuron_final_sigmodal/0_custom/'
2727

2828
# MODELS TO DEBUG THAT FEATURE N4 NORMALISATION
2929
# modelSourcePath = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/models/debug-normalizing/oligo-n4/0_custom/'
@@ -32,11 +32,11 @@
3232
# MODELS TO BE VALIDATED
3333
# modelSourcePath = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/models/oligo_fieldTest_WObrightness_longer/0_custom/'
3434

35-
source_dir_oligo = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/final/oligo_14/'
36-
source_dir_neuron = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/final/neuron_14/'
35+
source_dir_oligo = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/oligo_18/'
36+
source_dir_neuron = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/neuron_18/'
3737

38-
source_dir_paper_redo_oligo = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/final/oligo_6/'
39-
source_dir_paper_redo_neuron = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/final/neuron_6/'
38+
source_dir_paper_redo_oligo = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/oligo_6/'
39+
source_dir_paper_redo_neuron = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/neuron_6/'
4040

4141
# ######### To validate, use these whole well experiments: #########
4242
# source_dir = '/prodi/bioinf/bioinfdata/work/omnisphero/CNN/wholeWell/oligo/unannotated/'
@@ -254,7 +254,7 @@ def main(args):
254254
print('Number of arguments:', len(args), 'arguments.')
255255
print('Argument List:', str(args))
256256

257-
custom_paths = False
257+
custom_paths = False;
258258
for arg in args:
259259
arg = str(arg).lower()
260260
print('Evaluating arg: "'+arg+'".')
@@ -273,67 +273,98 @@ def custom_paths_predict():
273273
print('Your input: '+model_source_path);
274274

275275

276-
pass
277-
278276

279277
def prodi_gpu_predict():
280278
print('Running Predictions.')
281-
use_oligo = False
279+
use_oligo = True
282280
use_neuron = True
281+
use_glia = False
282+
use_old = False
283283

284-
use_debug = True
285-
use_paper = False
284+
use_debug = False
285+
use_paper = True
286286
skip_predicted = True
287287
n_jobs: int = 20
288288

289289
# Paper Models trained for N4
290-
model_source_path_oligo_paper = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/training/debug/paper-final_datagen/oligo-normalize4/'
291-
model_source_path_neuron_paper = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/training/debug/paper-final_datagen/neuron-normalize4/'
290+
model_source_path_oligo_paper = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/training/debug/paper-final_datagen/oligo-normalize4/'
291+
model_source_path_neuron_paper = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/training/debug/paper-final_datagen/neuron-normalize4/'
292+
model_source_path_glia = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN-glia/models/glia/smote/'
293+
294+
# .h5 dirs to be predicted for the paper
295+
# source_dir_redo_paper_oligo = '/prodi/bioinf/bioinfdata/work/omnisphero/CNN/final/oligo_paper/'
296+
# source_dir_redo_paper_neuron = '/prodi/bioinf/bioinfdata/work/omnisphero/CNN/final/neuron_paper/rosi/'
297+
298+
# .h5 dirs to be predicted for efsa or endpoints
299+
source_dir_paper_oligo = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/oligo_endpoints5/'
300+
source_dir_paper_neuron = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/neuron_endpoints5/'
301+
302+
source_dir_paper_oligo2 = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/oligo_endpoints6/'
303+
source_dir_paper_neuron2 = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/neuron_endpoints6/'
304+
305+
source_dir_glia = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN/final/glia_01/'
306+
307+
308+
if use_glia:
309+
predict_batch(model_source_path=model_source_path_glia, source_dir=source_dir_glia,
310+
normalize_enum=4,
311+
n_jobs=n_jobs,
312+
skip_predicted=skip_predicted,
313+
gpu_index_string="0")
292314

293-
# .h dirs to be predicted for the paper
294-
source_dir_redo_paper_oligo = '/prodi/bioinf/bioinfdata/work/omnisphero/CNN/final/oligo_paper/'
295-
source_dir_redo_paper_neuron = '/prodi/bioinf/bioinfdata/work/omnisphero/CNN/final/neuron_paper/rosi/'
296315

297-
# source_dir_redo_paper_oligo = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/final/oligo_13/'
298-
# source_dir_redo_paper_neuron = '/prodi/bioinf/bioinfdata/work/Omnisphero/CNN/final/neuron_13/'
316+
if use_paper:
317+
if use_neuron:
318+
predict_batch(model_source_path=model_source_path_neuron_paper, source_dir=source_dir_paper_neuron,
319+
normalize_enum=4,
320+
n_jobs=n_jobs,
321+
skip_predicted=skip_predicted,
322+
gpu_index_string="0")
323+
324+
predict_batch(model_source_path=model_source_path_neuron_paper, source_dir=source_dir_paper_neuron2,
325+
normalize_enum=4,
326+
n_jobs=n_jobs,
327+
skip_predicted=skip_predicted,
328+
gpu_index_string="0")
329+
if use_oligo:
330+
predict_batch(model_source_path=model_source_path_oligo_paper, source_dir=source_dir_paper_oligo,
331+
normalize_enum=4,
332+
n_jobs=n_jobs,
333+
skip_predicted=skip_predicted,
334+
gpu_index_string="0")
335+
predict_batch(model_source_path=model_source_path_oligo_paper, source_dir=source_dir_paper_oligo2,
336+
normalize_enum=4,
337+
n_jobs=n_jobs,
338+
skip_predicted=skip_predicted,
339+
gpu_index_string="0")
340+
if use_old:
341+
if use_neuron:
342+
predict_batch(model_source_path=model_source_path_neuron, source_dir=source_dir_neuron,
343+
normalize_enum=1,
344+
n_jobs=n_jobs,
345+
skip_predicted=skip_predicted,
346+
gpu_index_string="0")
347+
if use_oligo:
348+
predict_batch(model_source_path=model_source_path_oligo, source_dir=source_dir_oligo,
349+
normalize_enum=1,
350+
n_jobs=n_jobs,
351+
skip_predicted=skip_predicted,
352+
gpu_index_string="1")
353+
299354

300355
if use_debug:
356+
predict_batch(model_source_path=model_source_path_oligo_paper,
357+
source_dir=source_dir_oligo,
358+
normalize_enum=4,
359+
n_jobs=n_jobs,
360+
skip_predicted=False,
361+
gpu_index_string="0")
301362
predict_batch(model_source_path=model_source_path_neuron_paper,
302-
source_dir='/prodi/bioinf/bioinfdata/work/omnisphero/CNN/final/neuron_debug/',
363+
source_dir=source_dir_neuron,
303364
normalize_enum=4,
304-
n_jobs=1,
365+
n_jobs=n_jobs,
305366
skip_predicted=False,
306367
gpu_index_string="0")
307-
else:
308-
if use_paper:
309-
if use_neuron:
310-
predict_batch(model_source_path=model_source_path_neuron_paper, source_dir=source_dir_redo_paper_neuron,
311-
normalize_enum=4,
312-
n_jobs=n_jobs,
313-
skip_predicted=skip_predicted,
314-
gpu_index_string="0")
315-
if use_oligo:
316-
predict_batch(model_source_path=model_source_path_oligo_paper, source_dir=source_dir_redo_paper_oligo,
317-
normalize_enum=4,
318-
n_jobs=n_jobs,
319-
skip_predicted=skip_predicted,
320-
gpu_index_string="1")
321-
else:
322-
if use_neuron:
323-
predict_batch(model_source_path=model_source_path_neuron, source_dir=source_dir_neuron,
324-
normalize_enum=1,
325-
n_jobs=n_jobs,
326-
skip_predicted=skip_predicted,
327-
gpu_index_string="0")
328-
329-
if use_oligo:
330-
predict_batch(model_source_path=model_source_path_oligo, source_dir=source_dir_oligo,
331-
normalize_enum=1,
332-
n_jobs=n_jobs,
333-
skip_predicted=skip_predicted,
334-
gpu_index_string="1")
335-
336-
337368

338369
print(gct() + ' All Predictions done. Have a nice day. =)')
339370

train_model.py

Lines changed: 62 additions & 74 deletions
Original file line number | Diff line number | Diff line change
@@ -1145,91 +1145,79 @@ def decode_history_key(key: str) -> str:
11451145
return key
11461146

11471147

1148+
glia_path_train = [
1149+
'/home/nilfoe/bioinf/Omnisphero/CNN-glia/training/glia/JK247_ECM pretreated_trainingData_glia',
1150+
'/home/nilfoe/bioinf/Omnisphero/CNN-glia/training/glia/JK247_spheres pretreated_trainingData_glia',
1151+
'/home/nilfoe/bioinf/Omnisphero/CNN-glia/training/glia/JK274_normal_trainingData_glia',
1152+
'/home/nilfoe/bioinf/Omnisphero/CNN-glia/training/glia/VJK135_trainingData_glia',
1153+
'/home/nilfoe/bioinf/Omnisphero/CNN-glia/training/glia/VJK136_trainingData_glia'
1154+
]
1155+
1156+
glia_path_test='/home/nilfoe/bioinf/Omnisphero/CNN-glia/test/glia/'
1157+
1158+
glia_path_val = [
1159+
'/home/nilfoe/bioinf/Omnisphero/CNN-glia/validation/glia/'
1160+
]
1161+
11481162
def main():
11491163
# AUGMENTATION
11501164
data_gen = get_default_augmenter()
1165+
n_jobs = 20
11511166

1152-
out_path_base = out_path + 'paper-final_no-datagen' + os.sep
1153-
out_path_oligo = out_path_base + 'oligo' + os.sep
1154-
out_path_neuron = out_path_base + 'neuron' + os.sep
1155-
1156-
out_path_oligo_debug = out_path_base + 'oligo_debug' + os.sep
1157-
1158-
oligo_mode = True
1159-
neuron_mode = False
1160-
debug_mode = False
1161-
n_jobs = 40
1167+
out_path = '/home/nilfoe/prodi/bioinfdata/work/Omnisphero/CNN-glia/models/glia-extendedData/'
11621168

11631169
print('Sleeping....')
11641170
# time.sleep(18000)
11651171

1166-
if debug_mode:
1167-
train_model(
1168-
training_path_list=debug_oligos,
1169-
validation_path_list=debug_oligos_validation,
1170-
test_data_path='/prodi/bioinf/bioinfdata/work/omnisphero/CNN/training/oligo_kontrolliert_test/',
1171-
# data_gen=data_gen,
1172-
use_SMOTE=False,
1173-
out_path=out_path + 'paper-final_datagen' + os.sep + 'neuron_kontrolliert_undersampled' + os.sep,
1174-
gpu_index_string="3",
1175-
optimizer='SGD',
1176-
normalize_enum=4,
1177-
under_sample_train_data=True, under_sample_val_data=True,
1178-
epochs=5,
1179-
n_jobs=25
1180-
)
1181-
return
1172+
train_model(
1173+
training_path_list=glia_path_train,
1174+
validation_path_list=glia_path_val,
1175+
test_data_path=glia_path_test,
1176+
use_SMOTE=False,
1177+
out_path=out_path + 'base' + os.sep,
1178+
gpu_index_string="0",
1179+
optimizer='SGD',
1180+
n_jobs=n_jobs,
1181+
epochs=5000
1182+
)
11821183

1183-
if oligo_mode:
1184-
train_model(
1185-
training_path_list=final_oligos_validated,
1186-
validation_path_list=final_oligos_validated_validation_set,
1187-
test_data_path=test_data_path_oligo,
1188-
# training_path_list=oligo_paper_bleedthrough_path_train,
1189-
# validation_path_list=oligo_paper_bleedthrough_path_val,
1190-
# test_data_path=oligo_paper_bleedthrough_path_test,
1191-
# data_gen=data_gen,
1192-
use_SMOTE=False,
1193-
out_path=out_path + 'paper-final_datagen' + os.sep + 'oligo-normalize4-undersampling' + os.sep,
1194-
under_sample_train_data=True, under_sample_val_data=True,
1195-
gpu_index_string="1",
1196-
optimizer='SGD',
1197-
n_jobs=n_jobs,
1198-
epochs=5000
1199-
)
1184+
train_model(
1185+
training_path_list=glia_path_train,
1186+
validation_path_list=glia_path_val,
1187+
test_data_path=glia_path_test,
1188+
use_SMOTE=False,
1189+
out_path=out_path + 'datagen' + os.sep,
1190+
gpu_index_string="0",
1191+
optimizer='SGD',
1192+
n_jobs=n_jobs,
1193+
data_gen=data_gen,
1194+
epochs=5000
1195+
)
12001196

1201-
# paper-final_no-datagen\neuron
1202-
if neuron_mode:
1203-
train_model(
1204-
training_path_list=final_neurons_validated,
1205-
validation_path_list=final_neurons_validated_validation_set,
1206-
test_data_path=test_data_path_neuron,
1207-
# training_path_list=neuron_paper_bleedthrough_path_train,
1208-
# validation_path_list=neuron_paper_bleedthrough_path_val,
1209-
# test_data_path=neuron_paper_bleedthrough_path_test,
1210-
# data_gen=data_gen,
1211-
use_SMOTE=False,
1212-
out_path=out_path + 'paper-final_datagen' + os.sep + 'neuron-normalize4-undersampling' + os.sep,
1213-
under_sample_train_data=True, under_sample_val_data=True,
1214-
normalize_enum=4,
1215-
gpu_index_string="0",
1216-
optimizer='SGD',
1217-
n_jobs=n_jobs,
1218-
epochs=5000
1219-
)
1197+
train_model(
1198+
training_path_list=glia_path_train,
1199+
validation_path_list=glia_path_val,
1200+
test_data_path=glia_path_test,
1201+
use_SMOTE=True,
1202+
out_path=out_path + 'smote' + os.sep,
1203+
gpu_index_string="0",
1204+
optimizer='SGD',
1205+
n_jobs=n_jobs,
1206+
epochs=5000
1207+
)
12201208

1221-
# out_path_oligo = out_path+'oligo'+os.sep
1222-
# out_path_neuron = out_path+'neuron'+os.sep
1223-
1224-
#
1225-
# train_model_scrambling(path_candidate_list=final_oligos_validated,
1226-
# test_data_path=test_data_path_oligo,
1227-
# out_path=out_path_oligo,
1228-
# validation_count=1)
1229-
# train_model_scrambling(path_candidate_list=final_neurons_validated,
1230-
# test_data_path=test_data_path_neuron,
1231-
# out_path=out_path_neuron,
1232-
# validation_count=1)
1209+
train_model(
1210+
training_path_list=glia_path_train,
1211+
validation_path_list=glia_path_val,
1212+
test_data_path=glia_path_test,
1213+
use_SMOTE=True,
1214+
out_path=out_path + 'datagen_and_smote' + os.sep,
1215+
gpu_index_string="0",
1216+
optimizer='SGD',
1217+
n_jobs=n_jobs,
1218+
data_gen=data_gen,
1219+
epochs=5000
1220+
)
12331221

12341222
print('Finished all trainings. Goodbye.')
12351223

0 commit comments

Comments
 (0)