From 71233261d20b566c86a539101a77281ee16508df Mon Sep 17 00:00:00 2001 From: "Vera N. Karlbauer" <vera@karlbauer.org> Date: Tue, 13 Aug 2024 18:05:00 +0200 Subject: [PATCH] Replaced all RGSets with gRatioSets --- scripts/6_filtering_cpgs.Rmd | 37 +++++++++++++++++++----------------- 1 file changed, 20 insertions(+), 17 deletions(-) diff --git a/scripts/6_filtering_cpgs.Rmd b/scripts/6_filtering_cpgs.Rmd index e0870b2..db4c677 100644 --- a/scripts/6_filtering_cpgs.Rmd +++ b/scripts/6_filtering_cpgs.Rmd @@ -105,9 +105,10 @@ if (user_choices$array_type == "v2") { filter(CpG_name %in% replicates$CpG_name) %>% filter(!(IlmnID %in% keep_replicates$IlmnID)) - # exclude replicates from betas, RGSet, detP and save data - RGSet_clean <- subsetByLoci(RGSet_clean, excludeLoci = exclude_replicates$IlmnID) - save(RGSet_clean, file = paste0(user_choices$project_name, "/processed_data/RGSet_clean.Rdata")) + # exclude replicates from betas, gRatioSet, detP and save data + keep_gratioset <- !(featureNames(gRatioSet_clean) %in% exclude_replicates$IlmnID) + gRatioSet_clean <- gRatioSet_clean[keep_gratioset,] + save(gRatioSet_clean, file = paste0(user_choices$project_name, "/processed_data/gRatioSet_clean.Rdata")) keep_betas <- !(rownames(Betas_clean) %in% exclude_replicates$IlmnID) Betas_clean <- Betas_clean[keep_betas,] @@ -126,13 +127,13 @@ if (user_choices$array_type == "v2") { keep_betas_df <- as.data.frame(keep_betas) cat(paste0(nrow(exclude_replicates), " replicate probes were removed")) - dim_RGSet_filtered <- dim(RGSet_clean) + dim_gRatioSet_filtered <- dim(gRatioSet_clean) dim_Betas_filtered <- dim(Betas_clean) step_number <- c("4", "4") step <- c("Filter replicates", "Filter replicates") - data_class <- c("RGSet", "Betas") - samples <- c(dim_RGSet_filtered[2], dim_Betas_filtered[2]) - probes <- c(dim_RGSet_filtered[1], dim_Betas_filtered[1]) + data_class <- c("gRatioSet", "Betas") + samples <- c(dim_gRatioSet_filtered[2], dim_Betas_filtered[2]) + probes <- c(dim_gRatioSet_filtered[1], dim_Betas_filtered[1]) table_preprocessing_adding <- data.frame(step_number, step, data_class, samples, probes) summary_table_preprocessing <- bind_rows(summary_table_preprocessing, table_preprocessing_adding) @@ -371,7 +372,8 @@ if (user_choices$array_type == "v2") { keep_betas <- !(rownames(Betas_clean_filtered) %in% v2_mapping_inacc$IlmnID) Betas_clean_filtered <- Betas_clean_filtered[keep_betas,] - RGSet_clean_filtered <- subsetByLoci(RGSet_clean_filtered, excludeLoci = v2_mapping_inacc$IlmnID) + keep_gratioset <- !(featureNames(gRatioSet_clean_filtered) %in% v2_mapping_inacc$IlmnID) + gRatioSet_clean_filtered <- gRatioSet_clean_filtered[keep_gratioset,] } ``` @@ -381,13 +383,13 @@ if (user_choices$array_type == "v2") { cat(paste0(keep_betas_df %>% filter(keep_betas == FALSE) %>% nrow(), " CpGs show known mapping inaccuracies"), sep = "<br>\n") - dim_RGSet_filtered <- dim(RGSet_clean_filtered) + dim_gRatioSet_filtered <- dim(gRatioSet_clean_filtered) dim_Betas_filtered <- dim(Betas_clean_filtered) step_number <- c("12", "12") step <- c("Filter Mapping Inaccuracies", "Filter Mapping Inaccuracies") - data_class <- c("RGSet", "Betas") - samples <- c(dim_RGSet_filtered[2], dim_Betas_filtered[2]) - probes <- c(dim_RGSet_filtered[1], dim_Betas_filtered[1]) + data_class <- c("gRatioSet", "Betas") + samples <- c(dim_gRatioSet_filtered[2], dim_Betas_filtered[2]) + probes <- c(dim_gRatioSet_filtered[1], dim_Betas_filtered[1]) table_preprocessing_adding <- data.frame(step_number, step, data_class, samples, probes) summary_table_preprocessing <- bind_rows(summary_table_preprocessing, table_preprocessing_adding) @@ -401,7 +403,8 @@ if (user_choices$array_type == "v2") { keep_betas <- !(rownames(Betas_clean_filtered) %in% v2_flagged_probes$IlmnID) Betas_clean_filtered <- Betas_clean_filtered[keep_betas,] - RGSet_clean_filtered <- subsetByLoci(RGSet_clean_filtered, excludeLoci = v2_flagged_probes$IlmnID) + keep_gratioset <- !(featureNames(gRatioSet_clean_filtered) %in% v2_flagged_probes$IlmnID) + gRatioSet_clean_filtered <- gRatioSet_clean_filtered[keep_gratioset,] } ``` @@ -411,13 +414,13 @@ if (user_choices$array_type == "v2") { cat(paste0(keep_betas_df %>% filter(keep_betas == FALSE) %>% nrow(), " CpGs were flagged by Illumina"), sep = "<br>\n") - dim_RGSet_filtered <- dim(RGSet_clean_filtered) + dim_gRatioSet_filtered <- dim(gRatioSet_clean_filtered) dim_Betas_filtered <- dim(Betas_clean_filtered) step_number <- c("13", "13") step <- c("Filter Flagged Probes", "Filter Flagged Probes") - data_class <- c("RGSet", "Betas") - samples <- c(dim_RGSet_filtered[2], dim_Betas_filtered[2]) - probes <- c(dim_RGSet_filtered[1], dim_Betas_filtered[1]) + data_class <- c("gRatioSet", "Betas") + samples <- c(dim_gRatioSet_filtered[2], dim_Betas_filtered[2]) + probes <- c(dim_gRatioSet_filtered[1], dim_Betas_filtered[1]) table_preprocessing_adding <- data.frame(step_number, step, data_class, samples, probes) summary_table_preprocessing <- bind_rows(summary_table_preprocessing, table_preprocessing_adding)