In [16]:
library(tadaA)
In [26]:
setwd("/project/wgs/analysis/TADA/TADA-A")
Adjust mutation rate¶
In [12]:
TADA_A_adjust_mutrate(window_file = 'test_data/test_windows.txt',
mut_file = 'test_data/test_simulated_DNM.bed',
genes = "all",sample_size = 5000,
mutrate_mode = "regular",
scaling_file_name = "test_data/test_simulated_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt",
scale_features = c("GC_content", "div_score"))
Read in DNM data, annotation data and mutation rate data¶
In [13]:
compact_data <- TADA_A_read_info(
mut_files = c("test_data/test_simulated_DNM_with_allele_info.txt"),
window_file = "test_data/test_windows.txt",
mutrate_scaling_files = c("test_data/test_simulated_windows_mutrate_with_div_score_scaling_file_for_test_DNM.txt"),
sample_sizes = c(5000),
gene_prior_file = "test_data/test_gene_prior.txt",
nonAS_noncoding_annotations = "test_data/test_non_allele_specific_annotation_1.bed",
AS_noncoding_annotations = NA,
report_proportion = 2000/18665,
chunk_partition_num =1,
node_n = 1,
mutrate_ref_files = c("test_data/test_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_A.mutrate.bw",
"test_data/test_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_C.mutrate.bw",
"test_data/test_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_G.mutrate.bw" ,
"test_data/test_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_T.mutrate.bw"))
Estimate relative risks¶
In [19]:
RR = TADA_A_RR_estimate(data = compact_data$base_info,
selected_annotations = c(1), gene_prior_file = "test_data/test_gene_prior.txt",
optimization_iteration = 2000)
In [20]:
RR
Bayesian FDR control¶
In [18]:
Bayesian_FDR(BF=c(seq(1,10)), pi0=0.05, alpha=0.05)
calculate the Bayes factor for each gene based on informative noncodng annotations¶
In [28]:
TADA_A_get_BFs(data = compact_data$base_info,
selected_annotations = c(1,3),
rr = RR$rr_report$relative_risk,
additional_BF_file = "test_data/test_additional_BF_file",
TADA_p0 = 0.94)
generate DNM¶
In [24]:
TADA_A_DNM_generator(window_file = "/project/wgs/analysis/TADA/MS_data/Example_windows.bed",
mutrate_scaling_files = c("/project/wgs/analysis/TADA/MS_data/Example_windows_mutrate_scaling_file_for_Yuen_NM2015_cases_DNM.txt","../data/Example_windows_mutrate_scaling_file_for_Kong_cases_DNM.txt", "../data/Example_windows_mutrate_scaling_file_for_Wu_cases_DNM.txt", "../data/Example_windows_mutrate_scaling_file_for_Jiang_cases_DNM.txt", "../data/Example_windows_mutrate_scaling_file_for_Michaelson_cases_DNM.txt"),
sample_sizes = c(162, 78, 32, 32, 10),
gene_prior_file = "/project/wgs/analysis/TADA/MS_data/Example_gene_prior.txt",
nonAS_noncoding_annotations = c("/project/wgs/analysis/TADA/MS_data/Noonan_brain_roadmap_union_within_10kb_and_promoter_no_utr.bed","../data/Epigenome_E081_E082_intersection__within_10kb_and_promoter_no_utr.bed","../data/Encode_DHS_union_within_10kb_and_promoter_no_utr.bed"),
AS_noncoding_annotations = NA,
report_proportion = 100/18665,
chunk_partition_num =1 ,
node_n = 6,
mutrate_ref_files = c("/project/wgs/analysis/TADA/MS_data/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_A.mutrate.bw",
"/project/wgs/analysis/TADA/MS_data/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_C.mutrate.bw",
"/project/wgs/analysis/TADA/MS_data/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_G.mutrate.bw",
"/project/wgs/analysis/TADA/MS_data/Example_windows_extended_1bp_for_getting_base_level_mutrate.bed.fasta.tri.alt_T.mutrate.bw"),
rr = c(1, 0, 0.5),
output_allele_info_files = "allele_info",
output_bed_files = "allele_bed",
output_risk_genes_file = "temp.riskgenes",
compact_mut_output = NA,
MPI = 1)
retrieve_mutation_info¶
In [ ]:
retrieve_mutation_info(data_partition, genename, noncoding_annotation)