# ---------------------------------------------------------------------------
# Build the compact TADA-A input object for the WES de novo mutation set and
# save it as an RDS file.
#
# The script
#   1. calls TADA_A_read_info_by_chunks() (defined elsewhere; not part of this
#      file) with one mutation file, one scaling-factor file, a sample size of
#      6430 and seven allele-specific annotation sets,
#   2. wraps the call in system.time() so the elapsed time is printed, and
#   3. writes the returned object to a date-stamped .rds file.
#
# Commented-out lines are alternative inputs that were disabled in the
# original script; they are kept (in compact form) so they can be re-enabled.
# ---------------------------------------------------------------------------

# Return the four allele-specific file paths that share `prefix` and `suffix`,
# in the order A, C, G, T (the order used by every hand-written path vector in
# the original script).
#   prefix: text before the allele letter
#   suffix: text after the allele letter
# paste0() is used rather than sprintf() because several paths contain a
# literal "%" (e.g. "top5%_alt").
allele_files <- function(prefix, suffix) {
  paste0(prefix, c("A", "C", "G", "T"), suffix)
}

system.time(
  compact_data <- TADA_A_read_info_by_chunks(
    mut_files = "/storage11_7T/fuy/TADA-A/cell_WES/cd_mis_pli_syn.7131DNM.allele.bed",
    # c("db/MS_data/DNM/Jiang_cases_DNM_with_allele_info.txt",
    #   "db/MS_data/DNM/Kong_cases_DNM_with_allele_info.txt",
    #   "db/MS_data/DNM/Michaelson_cases_DNM_with_allele_info.txt",
    #   "db/MS_data/DNM/Yuen_NM2015_cases_DNM_with_allele_info.txt",
    #   "db/MS_data/DNM/Wu_cases_DNM_with_allele_info.txt"),
    window_file = 'db/MS_data/windows_partition/cd_windows_with_div_score.bed',
    mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_mis_pli_syn.7131DNM_6430fam_scaling_factors_x036.txt"),
    # sample_sizes = 4265,
    sample_sizes = 6430,
    # mutrate_scaling_files = c("db/MS_data/results/Jiang_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
    #                           "db/MS_data/results/Kong_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
    #                           "db/MS_data/results/Michaelson_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
    #                           "db/MS_data/results/Yuen_NM2015_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
    #                           "db/MS_data/results/Wu_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt"),
    # sample_sizes = c(32,78,10,162,32),
    gene_prior_file = "db/MS_data/prior/uniform_gene_prior.txt",
    nonAS_noncoding_annotations = NA,
    # c("/storage11_7T/fuy/TADA-A/annotation/ccr/ccrs.allchrom.gt90.bed"),
    #   "/storage11_7T/fuy/TADA-A/annotation/ccr/chr_ccr_gt95_syn_rm.bed"),

    # Allele-specific annotation sets. Each list element is a character
    # vector of four files (alt allele A, C, G, T). The order of the active
    # elements is the same as in the original script.
    AS_noncoding_annotations = list(
      ######################### interaction (all disabled) #####################
      # allele_files("/storage11_7T/fuy/TADA-A/db/MS_data/annota/spidex.alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/MVP/MVP.alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/primateAI/primateAI.alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/MPC_score/MPC2.alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/spliced/spliced5.top5%_alt", ".ccr90.bed"),
      #   ... same pattern for spliced6, spliced7, ..., spliced15
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/RADAR_RBP/", ".top001.ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/RBP-VarDB/RBP.ccr90.alt", ".bed"),
      # # allele_files("/storage11_7T/fuy/TADA-A/annotation/ribosnitch/ribosnitch.ccr90.alt", ".bed"),
      # # allele_files("/storage11_7T/fuy/TADA-A/annotation/CLIPdb/CLIPdb.ccr90.alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/spliced/spliced1.top5%_alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/spliced/spliced2.top5%_alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/spliced/spliced3.top5%_alt", ".ccr90.bed"),
      # # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/spliced/spliced4.top5%_alt", ".ccr90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_lof_alt_", ".bed.ccr.gt90.bed"),
      # # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain12_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain1_alt", ".bed.ccr_gt90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain1_primateAI_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain2_alt", "_ccr_gt90.bed"),
      # # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain3_alt", "_ccr_gt90.bed"),
      # # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain4_alt", "_ccr_gt90.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain5_alt", "_ccr_gt90.bed"),

      ######################## DeepSEA (all disabled) #######################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain/brain1_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain2_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain3_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain4_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/brain5_alt", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/DeepSEA/spliced_rbp/st.true.spliced1.top5%_alt", ".bed"),
      #   ... same pattern for st.true.spliced2, 4, 5, ..., 15
      #   (st.true.spliced3 was additionally commented out in the original)

      ####################### RADAR RBP (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/RADAR_RBP/", ".top005.bed"),

      ####################### WES denovo ptv (disabled) ############################
      # NOTE(review): the original hand-written vector listed
      # denovo_pLI_snv_alt_A.bed twice (1st and 4th entry) and never alt_T;
      # presumably a copy/paste slip - confirm before re-enabling.
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/pLI/denovo_pLI_snv_alt_", ".bed"),

      ####################### gnomad lof (PTV SNV: Nonsense, splice acceptor, and splice donor variants) (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/gnomad/gnomad.v2.1.1.all_lofs_snv_alt_", ".bed"),

      ####################### gnomad PTV tiers (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/pLI/pLI_nlt09_gnomad.v2.1.1.all_lofs_snv_alt_", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/pLI/pLI_05_995_gnomad.v2.1.1.all_lofs_snv_alt_", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/pLI/pLI_lt05_gnomad.v2.1.1.all_lofs_snv_alt_", ".bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/pLI/pLI_nlt_995_gnomad.v2.1.1.all_lofs_snv_alt_", ".bed"),

      ####################### annova missense (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_missense_alt_", ".bed"),

      ####################### annova lof ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_lof_alt_", ".bed"),
      allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_lof_alt_", ".nlt995.bed"),
      allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_lof_alt_", ".05-995.bed"),
      allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_lof_alt_", ".ls05.bed"),

      ####################### annova syn ############################
      allele_files("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/all_cd_syn_alt_", ".bed"),

      ####################### CADD (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/CADD/whole_genome_SNVs_gt15_alt", "_within_10kb_and_promoter_no_utr.bed"),

      ####################### RBP (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/RBP-VarDB/RBP.all.bed.merge_overlap_hg19_refGenes_exons.gtf.lg.transc.fa.RNAsnpM3.bed.abspos.p0.1.alt", ".bed.merge_in_coding_windows.bed"),

      ###################### MVP (disabled) ###########################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/MVP/chr_MVP_all_rare_missense_pathogen_rank_gt_75_alt_", ".bed"),

      ############################ primateAI (disabled) ################################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/primateAI/chr_primateAI_exome_mutation_pathogen_rank_gt_80_alt_", ".bed"),

      ########################## spidex (disabled) #############################
      # allele_files("/storage11_7T/fuy/TADA-A/db/MS_data/annota/spidex_public_noncommercial_v1_0.tab_alt_", "_lower10pct.bed"),

      ############## MPC ##################
      allele_files("/storage11_7T/fuy/TADA-A/annotation/MPC_score/fordist_constraint_official_mpc_values_v2_MPC_gt2_alt", ".bed"),
      allele_files("/storage11_7T/fuy/TADA-A/annotation/MPC_score/chr.MPC12_alt_", ".bed"),
      allele_files("/storage11_7T/fuy/TADA-A/annotation/MPC_score/chr.MPC01_alt_", ".bed")

      #################### ribosnitch (disabled) ###########################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/ribosnitch/hg19_refGenes_exons.gtf.lg.transc.fa.RNAsnpM3.bed.abspos.p0.1.alt", ".bed.merge.bed"),
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/ribosnitch/hg19_refGenes_exons.gtf.lg.transc.fa.RNAsnpM3.bed.abspos.p0.05.merged.alt", "_in_coding_windows.bed"),

      ###################### CLIPdb (disabled) ############################
      # allele_files("/storage11_7T/fuy/TADA-A/annotation/CLIPdb/human_combine.merged_hg19_refGenes_exons.gtf.lg.transc.fa.RNAsnpM3.bed.abspos.p0.05.merged.alt", ".bed")
    ),
    report_proportion = 18665/18665,
    # chunk_partition_num = 1,
    # NOTE(review): in the collapsed original, `chunk = 2, node_n = 2,`
    # followed `#chunk_partition_num =1,` on the same physical line; they are
    # restored here as active arguments - confirm against the signature of
    # TADA_A_read_info_by_chunks().
    chunk = 2,
    node_n = 2,
    mutrate_ref_files = c("db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_A.mutrate.bw",
                          "db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_C.mutrate.bw",
                          "db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_G.mutrate.bw",
                          "db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_T.mutrate.bw")
    # mutrate_ref_files = c("/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_A.uq.bedGraph.sort.bw",
    #                       "/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_C.uq.bedGraph.sort.bw",
    #                       "/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_G.uq.bedGraph.sort.bw",
    #                       "/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_T.uq.bedGraph.sort.bw")
  )
)

# Persist the result; the file name is prefixed with today's date (Sys.Date()).
saveRDS(compact_data,paste0("/storage11_7T/fuy/TADA-A/cell_WES/",Sys.Date(),"_wes_7131_annovar_pli_6430fam_x036_compact.rds"))