Boxplot of the difference in the number of HMRs between the non-CMP and CMP groups
# Data processing
# Count the HMR entries stored for each WGBS sample. The result has one entry
# per element of sample_ids_wgbs (instead of a hard-coded 100), so no padding
# zeros end up in the plot when the cohort size differs.
n_hmr <- vapply(
  sample_ids_wgbs,
  function(id) length(hmr[[id]]),
  numeric(1),
  USE.NAMES = FALSE  # keep df's default row names, as the index loop did
)

# Kept from the original script so that `m` still exists for any later code.
# NOTE(review): match.idx() is defined outside this chunk and `m` is not read
# below; drop this line if nothing else uses it.
m <- match.idx(sample_ids_wgbs, samples_cmp)

# Flag the samples that belong to the CMP group. The original initialised
# is_cmp to all FALSE and never updated it, so every sample was labelled
# "non-CMP" and the two-group comparison further down could not be computed.
# Assumes samples_cmp holds IDs in the same format as sample_ids_wgbs --
# TODO confirm.
is_cmp <- sample_ids_wgbs %in% samples_cmp

gg <- rep("non-CMP", length(sample_ids_wgbs))
gg[is_cmp] <- "CMP"

# HMR counts are expressed in thousands. The first column keeps its
# auto-generated name; later code looks it up by position.
df <- data.frame(n_hmr / 1000, groups = gg)
# Name of the first column of df, which holds the values plotted on the y axis
colname <- names(df)[1]

# Per-point colours: black by default, cornflowerblue for CMP samples
colors <- rep("black", nrow(df))
colors[which(df$groups == "CMP")] <- "cornflowerblue"

# Fix the group order so that non-CMP is drawn first, then CMP
df$groups <- factor(df$groups, levels = c("non-CMP", "CMP"))

# Wilcoxon rank-sum test of the y values between the two groups
test <- wilcox.test(df[, colname] ~ df$groups)
# Drawing
# Boxplot of the first column of df for each group, with every sample overlaid
# as a horizontally jittered point coloured by `colors`.
# aes_string() is deprecated in ggplot2; the `.data` pronoun maps the column
# whose name is stored in `colname` instead.
plist <- ggplot(df, aes(x = groups, y = .data[[colname]])) +
  xlab("") + ylab("") +
  # Boxplot outlier markers are suppressed; the jitter layer draws all points.
  geom_boxplot(outlier.shape = NA) +
  # height = 0 keeps the y values exact; only the x position is jittered.
  geom_jitter(
    size = 1,
    position = position_jitter(height = 0, width = 0.2),
    color = colors
  ) +
  theme_classic() +
  # Fixed 0-100 axis with ticks every 20 and no padding beyond the limits.
  scale_y_continuous(
    limits = c(0, 100),
    breaks = seq(0, 100, by = 20),
    expand = c(0, 0)
  )
# P value from the Wilcoxon test computed above (stored in `test`)
# W = 1686, p-value = 5.756e-12
Zhao S G, Chen W S, Li H, et al. The DNA methylation landscape of advanced prostate cancer[J]. Nature Genetics, 2020.
Original code