data:image/s3,"s3://crabby-images/b818f/b818fa30f4ffba0590b1efe4f4b148f375ee7763" alt=""
本期教程
data:image/s3,"s3://crabby-images/179ac/179acd848aff46bd9e8f5a13db4a858cfa973082" alt=""
「小杜的生信笔记」,自2021年11月开始做的知识分享,主要内容是「R语言绘图教程」、「转录组上游分析」、「转录组下游分析」等。凡是在社群的同学,可免费获得自2021年11月至今的全部教程,教程配有示例数据和相关代码,我们会持续更新。
往期教程部分内容
data:image/s3,"s3://crabby-images/59008/59008f0bc74f2e08341411e36858f0f4d58fca0d" alt=""
data:image/s3,"s3://crabby-images/ea874/ea8741584616ca944bbd67460358363715fb64fe" alt=""
data:image/s3,"s3://crabby-images/110d7/110d73f09258914f751e556a2490021367624e9b" alt=""
data:image/s3,"s3://crabby-images/f5f8f/f5f8fd3df2eb182fedd521f849e252e04d5fcafe" alt=""
data:image/s3,"s3://crabby-images/936e9/936e993ffd6a78c19ec837ad5059fae014cb082e" alt=""
data:image/s3,"s3://crabby-images/fbf67/fbf67f2028a462f8ecea038c3771343a24a35e5a" alt=""
data:image/s3,"s3://crabby-images/a0826/a082670e720e1ec1ec305224ea0e5c9ea1c60f65" alt=""
data:image/s3,"s3://crabby-images/c6dd1/c6dd109b0342cf538c0688815213be8826c2f347" alt=""
data:image/s3,"s3://crabby-images/a5614/a561445ee338e614124e0c413f74f5df741e4828" alt=""
data:image/s3,"s3://crabby-images/247bf/247bf174b6fbfc206e3e7a8b6bbbbd01b49dae27" alt=""
data:image/s3,"s3://crabby-images/97922/979228c9a60861313f217d326954051616eb0adb" alt=""
data:image/s3,"s3://crabby-images/2c295/2c295cebccf45e61e5ae702f6441baa872bc523f" alt=""
数据处理
有N个文件夹(每个文件夹对应一次重复实验)的数据需要处理,每个文件夹中有N个文件,如下所示。需要对这些数据进行批量处理。
data:image/s3,"s3://crabby-images/887da/887da57fdf32cde34f1534f419a835a42e669894" alt=""
data:image/s3,"s3://crabby-images/b08ee/b08ee24722c17f4250e0df40be97b70705cd37c3" alt=""
加载R包
# Switch to the project folder that holds the input data.
# NOTE(review): this absolute Windows path is machine-specific -- adjust it
# to your own project location before running.
setwd("D:\\BioinfoFile\\小杜的生信笔记\\2024\\20240511_分析手稿中IFN治疗的成像数据")
# Load the required R packages.
library("stringr")
library("tidyverse")
library("ggplot2")
创建分析文件夹
# Create the output folders next to the script; dir.create() warns (rather
# than fails) when a folder already exists because showWarnings is TRUE.
for (output_dir in c("figure", "result")) {
  dir.create(file.path(".", output_dir), showWarnings = TRUE)
}
加载数据及提取
# ---- Load and combine the quantification tables ----
# Directory layout read by this section:
#   <base_path>/<replicate>/*red_quant.csv     file names carry W<digits> and
#                                              F<digits> tags (well_id, fv_id)
#   <base_path>/<replicate>/*green_quant.csv   same name with "green" channel
#   <base_path>/<replicate>/experimental_design.csv   must have a `well` and a
#                                              `cell_num` column
base_path <- "./ifn_treatment/"

# Measurement columns kept from each merged red/green table, in output order.
measurement_columns <- c(
  "Area_red", "Mean_red", "Median_red", "Mean_green", "Median_green"
)

#' Read one red/green file pair and return one row per cell.
#'
#' @param replicate_path Folder of the replicate, ending in "/".
#' @param file_name Name of the red-channel file (ends in "red_quant.csv").
#' @param replicate Replicate label stored in the `replicate` column.
#' @return A data.frame with well_id, fv_id, cell_id, replicate and the
#'   columns listed in `measurement_columns`.
read_sample <- function(replicate_path, file_name, replicate) {
  # Only swap the channel tag at the end of the name; a global
  # gsub("red", "green") would also rewrite names such as "filtered_...".
  green_name <- sub("red_quant\\.csv$", "green_quant.csv", file_name)
  red_path <- paste0(replicate_path, file_name)
  green_path <- paste0(replicate_path, green_name)
  if (!file.exists(green_path)) {
    stop("Missing green-channel file for ", red_path, call. = FALSE)
  }

  data_red <- read.csv(red_path, sep = ",", row.names = 1)
  data_green <- read.csv(green_path, sep = ",", row.names = 1)
  # Rows are matched on their row names; columns present in both tables get
  # the "_red" / "_green" suffix.
  merged <- merge(
    data_red, data_green,
    by = "row.names", suffixes = c("_red", "_green")
  )

  # rep() keeps the construction valid when a table has zero rows.
  n_cells <- nrow(merged)
  sample_info <- data.frame(
    well_id = rep(str_extract(file_name, "W\\d+"), n_cells),
    fv_id = rep(str_extract(file_name, "F\\d+"), n_cells),
    cell_id = as.character(merged$Row.names),
    replicate = rep(replicate, n_cells),
    stringsAsFactors = FALSE
  )
  cbind(sample_info, merged[, measurement_columns, drop = FALSE])
}

#' Read every sample of one replicate and attach its experimental design.
#'
#' @param base_path Folder containing the replicate folders, ending in "/".
#' @param replicate Name of the replicate folder.
#' @return A tibble: all samples of the replicate joined to
#'   experimental_design.csv (well_id == well), with cell_num as a factor.
read_replicate <- function(base_path, replicate) {
  replicate_path <- paste0(base_path, replicate, "/")
  red_files <- list.files(replicate_path, pattern = "red_quant\\.csv$")
  if (length(red_files) == 0) {
    stop("No '*red_quant.csv' files found in ", replicate_path, call. = FALSE)
  }

  samples <- lapply(red_files, function(file_name) {
    read_sample(replicate_path, file_name, replicate)
  })
  # Bind once instead of growing the table inside the loop.
  measurements <- do.call(rbind, samples)

  exp_design <- read.csv(
    paste0(replicate_path, "experimental_design.csv"),
    sep = ","
  )
  exp_design$cell_num <- as.factor(exp_design$cell_num)

  as_tibble(merge(measurements, exp_design, by.x = "well_id", by.y = "well"))
}

#' Load all replicates below `base_path` into one table.
#'
#' @param base_path Folder containing the replicate folders, ending in "/".
#' @param replicates Replicate folder names; defaults to entries of
#'   `base_path` whose name matches "exp.*".
#' @return The row-bound replicate tables, or NULL (with a warning) when no
#'   replicate is found.
load_ifn_data <- function(base_path,
                          replicates = list.files(base_path, "exp.*")) {
  if (length(replicates) == 0) {
    warning(
      "No replicate folders matching 'exp.*' found in ", base_path,
      call. = FALSE
    )
    return(NULL)
  }
  replicate_tables <- lapply(replicates, function(replicate) {
    read_replicate(base_path, replicate)
  })
  do.call(rbind, replicate_tables)
}

replicates <- list.files(base_path, "exp.*")
data.ifn <- load_ifn_data(base_path, replicates)

### Quality control
# Inspect structure, per-column summaries and dimensions of the result.
str(data.ifn)
summary(data.ifn)
dim(data.ifn)
data:image/s3,"s3://crabby-images/56dcb/56dcbf3360ac06948cef046e83dd17b89629ea9a" alt=""
保存数据
# Save the combined table as CSV in the result folder.
write.csv(
  x = data.ifn,
  file = "./result/data.ifn.output.csv"
)
绘图
1. 绘制直方图(各组半透明叠加显示)
# Histogram of Median_red per replicate. Each cell_line/cell_num combination
# is one fill group; groups are overlaid (position = "identity") and made
# semi-transparent so they remain visible.
data.ifn %>%
  mutate(group = paste0(cell_line, "_", cell_num)) %>%
  ggplot(aes(x = Median_red, fill = group)) +
  geom_histogram(position = "identity", alpha = 0.5, color = "white") +
  # Show the x axis on a log10 scale.
  scale_x_log10() +
  facet_wrap(~ replicate)
2. 散点图(以二维分箱密度图 geom_bin2d 的形式展示)
# 2D binned counts of Area_red against Median_red, both on log10 axes,
# with one panel per cell_line/replicate combination.
ggplot(data = data.ifn, mapping = aes(x = Median_red, y = Area_red)) +
  geom_bin2d(bins = 70) +
  scale_x_log10() +
  scale_y_log10() +
  facet_wrap(~ cell_line + replicate) +
  theme_bw()
data:image/s3,"s3://crabby-images/189cc/189ccad3ae30f7566c162d0327cd9ca17c365117" alt=""
若我们的教程对你有所帮助,请点赞+收藏+转发,这是对我们最大的支持。
往期部分文章
「1. 最全WGCNA教程(替换数据即可出全部结果与图形)」
「2. 精美图形绘制教程」
「3. 转录组分析教程」
「4. 转录组下游分析」
「小杜的生信笔记」,主要发表或收录生物信息学教程,以及基于R的分析和可视化(包括数据分析、图形绘制等);分享感兴趣的文献和学习资料!