@@ -29,11 +29,22 @@ def __init__(
2929 PSMReader_w_FragBase .__init__ (
3030 self , frag_types = frag_types , max_frag_charge = max_frag_charge , ** kwargs
3131 )
32- pFindReader .__init__ (self )
32+ pFindReader .__init__ (
33+ self ,
34+ column_mapping = {
35+ "sequence" : "peptide" ,
36+ "charge" : "charge" ,
37+ "rt" : "RT" ,
38+ "raw_name" : "raw_name" ,
39+ "query_id" : "spec" ,
40+ "scan_num" : "scan_num" ,
41+ },
42+ )
3343
34- psmlabel_columns = "b,b-NH3,b-H20,b-ModLoss,y,y-HN3,y-H20,y-ModLoss" .split ("," )
3544 self .psmlabel_frag_columns = []
3645 self .frag_df_columns = {}
46+
47+ psmlabel_columns = "b,b-NH3,b-H20,b-ModLoss,y,y-HN3,y-H20,y-ModLoss" .split ("," )
3748 for _type in psmlabel_columns :
3849 frag_idxes = [
3950 i
@@ -44,18 +55,11 @@ def __init__(
4455 self .psmlabel_frag_columns .append (_type )
4556 self .frag_df_columns [_type ] = np .array (frag_idxes , dtype = int )
4657
47- def _init_column_mapping (self ):
48- self .column_mapping = {
49- "sequence" : "peptide" ,
50- "charge" : "charge" ,
51- "rt" : "RT" ,
52- "raw_name" : "raw_name" ,
53- "query_id" : "spec" ,
54- "scan_num" : "scan_num" ,
55- }
56-
5758 def _load_file (self , filename ):
58- psmlabel_df = pd .read_csv (filename , sep = "\t " )
59+ df = pd .read_csv (filename , sep = "\t " )
60+ return df
61+
62+ def _pre_process (self , psmlabel_df : pd .DataFrame ):
5963 psmlabel_df .fillna ("" , inplace = True )
6064
6165 if psmlabel_df ["spec" ].values [0 ].count ("." ) >= 4 : # pfind
@@ -79,16 +83,16 @@ def _load_modifications(self, psmlabel_df: pd.DataFrame):
7983 * psmlabel_df ["modinfo" ].apply (get_pFind_mods )
8084 )
8185
82- def _translate_decoy (self , df ):
86+ def _translate_decoy (self ):
8387 pass
8488
85- def _translate_score (self , df ):
89+ def _translate_score (self ):
8690 pass
8791
8892 def _translate_modifications (self ):
8993 self ._psm_df ["mods" ] = self ._psm_df ["mods" ].apply (translate_pFind_mod )
9094
91- def _post_process (self , psmlabel_df : pd . DataFrame ):
95+ def _post_process (self , psmlabel_df ):
9296 psmlabel_df ["nAA" ] = psmlabel_df .peptide .str .len ()
9397 self ._psm_df ["nAA" ] = psmlabel_df .nAA
9498 psmlabel_df = psmlabel_df [~ self ._psm_df ["mods" ].isna ()].reset_index (drop = True )
0 commit comments