Simplify and fix summary stats
This commit is contained in:
@@ -156,7 +156,7 @@ update_gene_names <- function(df, sgd_gene_list) {
|
|||||||
}
|
}
|
||||||
|
|
||||||
calculate_summary_stats <- function(df, variables, group_vars = c("OrfRep", "conc_num", "conc_num_factor")) {
|
calculate_summary_stats <- function(df, variables, group_vars = c("OrfRep", "conc_num", "conc_num_factor")) {
|
||||||
# Summarize the variables within the grouped data
|
|
||||||
summary_stats <- df %>%
|
summary_stats <- df %>%
|
||||||
group_by(across(all_of(group_vars))) %>%
|
group_by(across(all_of(group_vars))) %>%
|
||||||
summarise(
|
summarise(
|
||||||
@@ -172,11 +172,10 @@ calculate_summary_stats <- function(df, variables, group_vars = c("OrfRep", "con
|
|||||||
)
|
)
|
||||||
|
|
||||||
# Create a cleaned version of df that doesn't overlap with summary_stats
|
# Create a cleaned version of df that doesn't overlap with summary_stats
|
||||||
cols_to_exclude <- unique(c(variables, group_vars))
|
cols_to_keep <- setdiff(names(df), names(summary_stats)[-which(names(summary_stats) %in% group_vars)])
|
||||||
df_cleaned <- df %>%
|
df_cleaned <- df %>%
|
||||||
select(-any_of(cols_to_exclude))
|
select(all_of(cols_to_keep))
|
||||||
|
|
||||||
# Join the stats back to the original dataframe
|
|
||||||
df_with_stats <- left_join(df_cleaned, summary_stats, by = group_vars)
|
df_with_stats <- left_join(df_cleaned, summary_stats, by = group_vars)
|
||||||
|
|
||||||
return(list(summary_stats = summary_stats, df_with_stats = df_with_stats))
|
return(list(summary_stats = summary_stats, df_with_stats = df_with_stats))
|
||||||
|
|||||||
Reference in New Issue
Block a user