# Build `compact_data` with TADA_A_read_info_by_chunks() and save it as an RDS
# file whose name is prefixed with the current date.
#
# The call is wrapped in system.time() so the elapsed time is reported.
# TADA_A_read_info_by_chunks() is defined outside this script; the meaning of
# each argument is set by that function and is not restated here.
#
# Commented-out entries below are alternative inputs kept from earlier runs.
# The active choices (pli995 + MPC2 annotations, sample size 6430, scaling file
# 1484_d_1630) are the ones spelled out in the output file name at the bottom,
# so update that name whenever an active input is swapped.
system.time(compact_data <- TADA_A_read_info_by_chunks(
  mut_files = "/storage11_7T/fuy/TADA-A/cell_WES/DNM/12166DNM.affected.allele.bed",
  # c("db/MS_data/DNM/Jiang_cases_DNM_with_allele_info.txt",
  #   "db/MS_data/DNM/Kong_cases_DNM_with_allele_info.txt",
  #   "db/MS_data/DNM/Michaelson_cases_DNM_with_allele_info.txt",
  #   "db/MS_data/DNM/Yuen_NM2015_cases_DNM_with_allele_info.txt",
  #   "db/MS_data/DNM/Wu_cases_DNM_with_allele_info.txt"),
  window_file = 'db/MS_data/windows_partition/cd_windows_with_div_score.bed',
  # mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_uniform_scaling_factors_1441_d_1692.txt"),
  # mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_uniform_scaling_factors.txt"),
  # mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_uniform_scaling_factors_1441_d_1068.txt"),
  # mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_uniform_scaling_factors_1435_d_1052.txt"),
  # mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_uniform_scaling_factors_1505_d_1692.txt"),
  mutrate_scaling_files = c("/storage11_7T/fuy/TADA-A/cell_WES/cd_uniform_scaling_factors_1484_d_1630.txt"),
  sample_sizes = 6430,
  # sample_sizes = 4059,
  # sample_sizes = 4000,
  # mutrate_scaling_files = c("db/MS_data/results/Jiang_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
  #                           "db/MS_data/results/Kong_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
  #                           "db/MS_data/results/Michaelson_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
  #                           "db/MS_data/results/Yuen_NM2015_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
  #                           "db/MS_data/results/Wu_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt"),
  # sample_sizes = c(32,78,10,162,32),
  gene_prior_file = "db/MS_data/prior/uniform_gene_prior.txt",
  nonAS_noncoding_annotations = NA,
  #c(
  #  "/storage11_7T/fuy/TADA-A/annotation/ccr/ccrs.allchrom.gt90.bed"),
  #"/storage11_7T/fuy/TADA-A/annotation/ccr/chr_ccr_gt95_syn_rm.bed"),
  # Each active list element is a vector of four files, one per alternate
  # allele in A, C, G, T order (per the file names).
  AS_noncoding_annotations = list(
    # c("/storage11_7T/fuy/TADA-A/annotation/driverMAPS/autos.cd.window.all_cd_syn_alt_A.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/driverMAPS/autos.cd.window.all_cd_syn_alt_C.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/driverMAPS/autos.cd.window.all_cd_syn_alt_G.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/driverMAPS/autos.cd.window.all_cd_syn_alt_T.bed")
    c("/storage11_7T/fuy/TADA-A/annotation/pLI/auto/auto.annovar_cd_window_pli995_altA.bed",
      "/storage11_7T/fuy/TADA-A/annotation/pLI/auto/auto.annovar_cd_window_pli995_altC.bed",
      "/storage11_7T/fuy/TADA-A/annotation/pLI/auto/auto.annovar_cd_window_pli995_altG.bed",
      "/storage11_7T/fuy/TADA-A/annotation/pLI/auto/auto.annovar_cd_window_pli995_altT.bed"),
    # c("/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli05-995_altA.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli05-995_altC.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli05-995_altG.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli05-995_altT.bed") ,
    # c("/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli0-05_altA.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli0-05_altC.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli0-05_altG.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/pLI/annovar_cd_window_pli0-05_altT.bed") ,
    # c("/storage11_7T/fuy/TADA-A/db/MS_data/annota/spidex_public_noncommercial_v1_0.tab_alt_A_lower10pct.bed",
    #   "/storage11_7T/fuy/TADA-A/db/MS_data/annota/spidex_public_noncommercial_v1_0.tab_alt_C_lower10pct.bed",
    #   "/storage11_7T/fuy/TADA-A/db/MS_data/annota/spidex_public_noncommercial_v1_0.tab_alt_G_lower10pct.bed",
    #   "/storage11_7T/fuy/TADA-A/db/MS_data/annota/spidex_public_noncommercial_v1_0.tab_alt_T_lower10pct.bed") ,
    c("/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/auto/auto.A.cd.MPC2.annovar.bed",
      "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/auto/auto.C.cd.MPC2.annovar.bed",
      "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/auto/auto.G.cd.MPC2.annovar.bed",
      "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/auto/auto.T.cd.MPC2.annovar.bed")
    # c("/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/A.cd.MPC12.annovar.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/C.cd.MPC12.annovar.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/G.cd.MPC12.annovar.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/T.cd.MPC12.annovar.bed") ,
    # c("/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/A.cd.MPC01.annovar.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/C.cd.MPC01.annovar.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/G.cd.MPC01.annovar.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MPC_score/annovar/T.cd.MPC01.annovar.bed") ,
    ##############
    # c("/storage11_7T/fuy/TADA-A/annotation/primateAI/chr_primateAI_exome_mutation_pathogen_rank_gt_80_alt_A.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/primateAI/chr_primateAI_exome_mutation_pathogen_rank_gt_80_alt_C.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/primateAI/chr_primateAI_exome_mutation_pathogen_rank_gt_80_alt_G.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/primateAI/chr_primateAI_exome_mutation_pathogen_rank_gt_80_alt_T.bed") ,
    # c("/storage11_7T/fuy/TADA-A/annotation/MVP/chr_MVP_all_rare_missense_pathogen_rank_gt_75_alt_A.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MVP/chr_MVP_all_rare_missense_pathogen_rank_gt_75_alt_C.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MVP/chr_MVP_all_rare_missense_pathogen_rank_gt_75_alt_G.bed",
    #   "/storage11_7T/fuy/TADA-A/annotation/MVP/chr_MVP_all_rare_missense_pathogen_rank_gt_75_alt_T.bed")
  ),
  report_proportion = 18665/18665,
  #chunk_partition_num =1,
  # NOTE(review): confirm that `chunk` and `node_n` are meant to be active
  # arguments; they sit directly after the disabled `chunk_partition_num` and
  # may have been intended to be disabled together with it.
  chunk = 2,
  node_n = 2,
  mutrate_ref_files = c("db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_A.mutrate.bw",
                        "db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_C.mutrate.bw",
                        "db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_G.mutrate.bw",
                        "db/MS_data/mutrate/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_T.mutrate.bw")
  # mutrate_ref_files = c("/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_A.uq.bedGraph.sort.bw" ,
  #                       "/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_C.uq.bedGraph.sort.bw" ,
  #                       "/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_G.uq.bedGraph.sort.bw" ,
  #                       "/storage11_7T/data.for.yuwen/new_mutrate/window.hg19.genome.tri2.alt_T.uq.bedGraph.sort.bw" )
))

# Persist the result; Sys.Date() prefixes the file name with the run date.
saveRDS(compact_data,paste0("/storage11_7T/fuy/TADA-A/cell_WES/DNM/",Sys.Date(),"_12166DNM_6430_fam_auto_pli995_MPC2_1484_d_1630_compact.rds"))