Skip to content

Commit 1dfcccf

Browse files
committed
added processing of copy_number master table
1 parent 3c1e18b commit 1dfcccf

File tree

1 file changed

+33
-0
lines changed

1 file changed

+33
-0
lines changed

scripts/prepare_data_for_improve.py

Lines changed: 33 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -373,8 +373,41 @@ def process_datasets(args):
373373
# create copynumber master table
374374
#-------------------------------------------------------------------
375375

376+
merged_copy_number = merge_master_tables(args, data_sets=data_sets, data_type='copy_number')
376377

378+
merged_copy_number = pd.merge(
379+
merged_copy_number,
380+
data_gene_names[[
381+
'entrez_id',
382+
'ensemble_gene_id',
383+
'gene_symbol'
384+
]],
385+
how='left',
386+
on='entrez_id',
387+
)
377388

389+
merged_copy_number.insert(
390+
1,
391+
'ensemble_gene_id',
392+
merged_copy_number.pop('ensemble_gene_id')
393+
)
394+
merged_copy_number.insert(
395+
1,
396+
'gene_symbol',
397+
merged_copy_number.pop('gene_symbol')
398+
)
399+
400+
# write the transposed copy number table to 'data_out/x_data/cancer_copy_number.tsv' (relative to args.WORKDIR)
401+
outfile_path = args.WORKDIR.joinpath(
402+
"data_out",
403+
"x_data",
404+
"cancer_copy_number.tsv"
405+
)
406+
merged_copy_number.transpose().to_csv(
407+
path_or_buf=outfile_path,
408+
sep='\t',
409+
header=False
410+
)
378411
# join the "meta data tables" like copynumber etc.
379412

380413

0 commit comments

Comments
 (0)