@@ -151,14 +151,43 @@ regtools_data = subset(regtools_data, select=columns_to_keep)
151
151
152
152
# zeroes need to be added in for some samples
153
153
a <- function (x , y , z ){
154
- toAdd <- y - length(x ) - str_count( z , ' , ' ) - 1
154
+ toAdd <- y - length(x ) - 1
155
155
# browser()
156
156
toAdd <- rep(0.0000000 , toAdd )
157
157
x <- c(x , toAdd )
158
158
return (x )
159
159
}
160
160
x <- mapply(a , regtools_data $ norm_scores_non , length(all_samples ), regtools_data $ samples )
161
+
162
+
163
+ # if (typeof(x) == 'list') {
164
+ # x <- matrix(pad(unlist(x), ncols),nrow = rows, byrow = TRUE, ncol = cols)
165
+ # x <- t(x)
166
+ # }
167
+ # browser()
168
+
169
+ get_num_zeros_to_rm <- function (z ){
170
+ num_zeroes_to_rm = str_count(z , ' ,' )
171
+ return (num_zeroes_to_rm )
172
+ }
173
+
174
+ num_zeroes_to_rm <- mapply(get_num_zeros_to_rm , regtools_data $ samples )
175
+
176
+ x = split(x , rep(1 : ncol(x ), each = nrow(x )))
161
177
regtools_data $ norm_scores_non = x
178
+ regtools_data $ zeroes_to_rm = num_zeroes_to_rm
179
+
180
+ rm_zeroes <- function (x ,y ){
181
+ new_length <- length(x ) - y
182
+ x <- sort(x ,decreasing = TRUE )
183
+ x <- x [1 : new_length ]
184
+ return (x )
185
+ }
186
+
187
+ if (max(num_zeroes_to_rm > 0 )) {
188
+ x <- mapply(rm_zeroes , regtools_data $ norm_scores_non , regtools_data $ zeroes_to_rm )
189
+ regtools_data $ norm_scores_non = x
190
+ }
162
191
print(" test7" )
163
192
164
193
# ############### calculate p-values ############################################
@@ -187,8 +216,8 @@ a <- function(x){
187
216
}
188
217
189
218
regtools_data $ p_value <- apply(regtools_data , 1 , a )
190
- print(" test8 " )
191
-
219
+ print(" Number of rows in data.table " )
220
+ print(length( regtools_data $ samples ))
192
221
193
222
paste_commas <- function (v ){
194
223
return (paste(v ,collapse = " ," ))
@@ -203,7 +232,7 @@ regtools_data = subset(regtools_data, select=columns_to_keep)
203
232
colnames(regtools_data ) <- c(' variant_samples' , ' variant_info' , ' genes' , ' junction_samples' , " chrom" , " start" , " end" , ' strand' , ' anchor' , ' variant_junction_info' ,
204
233
' names' , ' mean_norm_score_variant' , ' sd_norm_score_variant' , ' norm_scores_variant' ,
205
234
' total_score_variant' , ' mean_norm_score_non' , ' sd_norm_score_non' , ' norm_scores_non' ,
206
- ' total_score_non' , ' p_value ' )
235
+ ' total_score_non' , ' pvalue ' )
207
236
regtools_data $ sd_norm_score_variant [is.na(regtools_data $ sd_norm_score_variant )] = 0
208
237
regtools_data $ mean_norm_score_non [is.na(regtools_data $ mean_norm_score_non )] = 0
209
238
regtools_data $ sd_norm_score_non [is.na(regtools_data $ sd_norm_score_non )] = 0
@@ -213,6 +242,6 @@ all_splicing_variants <- as.data.table(all_splicing_variants)
213
242
regtools_data = regtools_data %> % distinct()
214
243
215
244
216
- write.table(regtools_data , file = paste(input_file , " _out_test .tsv" , sep = " " ), quote = FALSE , sep = ' \t ' , row.names = F )
245
+ write.table(regtools_data , file = paste(input_file , " _out .tsv" , sep = " " ), quote = FALSE , sep = ' \t ' , row.names = F )
217
246
218
247
})
0 commit comments