forked from hgrandjean/Anti-Fungi-Peptide
-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathsplit.py
More file actions
27 lines (24 loc) · 961 Bytes
/
split.py
File metadata and controls
27 lines (24 loc) · 961 Bytes
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
import math
# Default locations used by the pipeline (relative to the working directory).
POSITIVE_KMERS_PATH = "kmr_pos_temp/pos.kmr"
NEGATIVE_KMERS_PATH = "kmr_neg_temp/neg.kmr"
OUTPUT_TSV_PATH = "unique_set.tsv"


def read_kmers(path):
    """Return the descriptors stored one per line in the file at *path*.

    Each line is stripped of surrounding whitespace (including the line
    terminator) so that the same descriptor always maps to the same key,
    whether or not it is the last line of a file lacking a trailing
    newline. Lines that are empty after stripping are skipped.

    Raises:
        OSError: if the file cannot be opened or read.
    """
    with open(path, "r") as handle:
        stripped_lines = (line.strip() for line in handle)
        return [kmer for kmer in stripped_lines if kmer]


def count_kmers(positive, negative):
    """Count the occurrences of every descriptor in both collections.

    Args:
        positive: iterable of descriptors from the positive set.
        negative: iterable of descriptors from the negative set.

    Returns:
        A dict mapping each descriptor to a three-item list
        ``[positive_count, negative_count, 0]``; the last slot is a
        placeholder for the score filled in by ``score_kmers``. Keys are
        in order of first appearance: positive descriptors first, then
        the descriptors seen only in the negative set.
    """
    kmers_counter = {}
    for kmer in positive:
        kmers_counter.setdefault(kmer, [0, 0, 0])[0] += 1
    for kmer in negative:
        kmers_counter.setdefault(kmer, [0, 0, 0])[1] += 1
    return kmers_counter


def score_kmers(kmers_counter):
    """Fill in the score slot of every entry, in place, and return the dict.

    The score is ``log((positive_count + 1) / (negative_count + 1))``
    (natural logarithm). Adding one to both counts keeps the ratio finite
    and strictly positive even when a descriptor is absent from one set.
    """
    for entry in kmers_counter.values():
        entry[2] = math.log((entry[0] + 1) / (entry[1] + 1))
    return kmers_counter


def write_scores(kmers_counter, path):
    """Write one ``descriptor<TAB>[pos, neg, score]`` row per entry to *path*.

    The second column is the ``str()`` of the three-item list, which is the
    format this script has always produced.

    Raises:
        OSError: if the file cannot be opened or written.
    """
    with open(path, "w") as save:
        for kmer, entry in kmers_counter.items():
            save.write(str(kmer).strip() + '\t' + str(entry) + '\n')


def main(pos_path=POSITIVE_KMERS_PATH, neg_path=NEGATIVE_KMERS_PATH,
         out_path=OUTPUT_TSV_PATH):
    """Count, score and save the descriptors of the positive/negative sets.

    Args:
        pos_path: file holding the positive descriptors, one per line.
        neg_path: file holding the negative descriptors, one per line.
        out_path: destination of the tab-separated result.

    Returns:
        The scored dict that was written to *out_path*.
    """
    positive = read_kmers(pos_path)
    negative = read_kmers(neg_path)
    kmers_counter = score_kmers(count_kmers(positive, negative))
    write_scores(kmers_counter, out_path)
    return kmers_counter


if __name__ == "__main__":
    main()