单细胞-第四节 多样本数据分析,下游画图

文件在单细胞\5_GC_py\1_single_cell\2_plots.Rmd

1.细胞数量条形图

c 复制代码
rm(list = ls())
library(Seurat)
load("seu.obj.Rdata")

dat = as.data.frame(table(Idents(seu.obj)))
dat$label = paste(dat$Var1,dat$Freq,sep = ":")
head(dat)
library(ggplot2)
library(paletteer)
#View(palettes_d_names)
ggplot(dat,aes(x = Freq,fill = Var1,y = Var1))+
  scale_fill_paletteer_d("ggsci::category20_d3")+
  geom_bar(stat = "identity")+
  theme_bw()+
  geom_text(aes(x = 0,label = label),hjust = 0)+
  theme(axis.text.y = element_blank(),   # 隐藏纵坐标刻度文字
        axis.ticks.y = element_blank(),
        axis.title.y = element_blank())  # 隐藏纵坐标刻度线

2.细胞比例条形图

c 复制代码
seu.obj$seurat_annotation = seu.obj@active.ident
ggplot(seu.obj@meta.data,aes(orig.ident,fill = seurat_annotation))+
  geom_bar(position = "fill", alpha = 0.9,width = 0.5)+
  scale_fill_paletteer_d("ggsci::category20_d3")+
  theme_classic()+
  coord_flip()+
  coord_fixed(ratio = 4) #纵轴长度是横轴的4倍

3.小提琴图

c 复制代码
load("markers.Rdata")
library(tidyverse)
g = allmarkers %>% group_by(cluster) %>% top_n(1,wt = avg_log2FC) %>% pull(gene)

m = as.matrix(seu.obj@assays$RNA@layers$data)
rownames(m) = Features(seu.obj)
colnames(m) = Cells(seu.obj)
vln.df <- m %>%
  t() %>%
  as.data.frame()%>%
  select(g) %>% 
  rownames_to_column("CB") %>% 
  mutate(cluster = seu.obj$seurat_annotation)%>%
  pivot_longer(cols = 2:(ncol(.)-1),#宽边长
               names_to = "gene",
               values_to = "exp") %>% 
  mutate(gene = factor(gene,levels = g))
head(vln.df)
c 复制代码
# 自定义颜色
library(paletteer)
my_color = paletteer_d(`"ggsci::category20_d3"`)
my_color = colorRampPalette(my_color)(length(unique(vln.df$cluster)))
# 画图
p1 <- ggplot(vln.df,aes(exp,cluster),color=factor(cluster))+
  geom_violin(aes(fill=cluster),scale = "width")+
  scale_fill_manual(values = my_color)+
  facet_grid(.~gene,scales = "free_y", switch = "x")+
  scale_x_continuous(expand = c(0,0),position = "top")+
  theme_bw()+
  theme(
    panel.grid = element_blank(),
    axis.title.x.top = element_blank(),
    #axis.ticks.x.bottom = element_blank(),
    axis.text.x.top= element_text(hjust = 1,vjust = NULL,color = "black",size = 7),
    #axis.title.y.left = element_blank(),
    #axis.ticks.y.left = element_blank(),
    #axis.text.y.left = element_blank(),
    legend.position = "none",
    panel.spacing.y = unit(0, "cm"),
    strip.text.y = element_text(angle=0,size = 14,hjust = 0),
    strip.background.y = element_blank()
  )
p1

4.气泡图

c 复制代码
g = allmarkers %>% group_by(cluster) %>% top_n(5,wt = avg_log2FC) %>% pull(gene) %>% unique()
DotPlot(seu.obj,features = g,cols = "RdYlBu")+RotatedAxis()

5.GC基因韦恩图

c 复制代码
f = read.delim("gcgene.txt",header = F)
k = allmarkers$p_val_adj<0.05 & allmarkers$avg_log2FC>2
table(k)
g = intersect(allmarkers$gene[k],f$V1)
save(g,file = "g.Rdata")
library(tinyarray)
draw_venn(list(pyroptosis = f$V1,
               marker = unique(allmarkers$gene[k])),"")
ggsave("venn.png")
c 复制代码
m = as.matrix(seu.obj@assays$RNA@layers$data)
rownames(m) = Features(seu.obj)
colnames(m) = Cells(seu.obj)
m = m[g,]
ac = data.frame(row.names = colnames(m),
                celltype = Idents(seu.obj))
library(dplyr)
ac = arrange(ac,celltype)
m = m[,rownames(ac)]
pheatmap::pheatmap(m,show_colnames = F,cluster_cols = F,cluster_rows = F,scale = "row",breaks = seq(-1.6,3,length.out = 100),annotation_col = ac)

6.差异焦亡基因富集分析

c 复制代码
e = quick_enrich(g,destdir = tempdir())
e[[4]]+e[[3]]
相关推荐
纠结哥_Shrek4 小时前
基于最近邻数据进行分类
人工智能·分类·数据挖掘
Melancholy 啊5 小时前
细说机器学习算法之ROC曲线用于模型评估
人工智能·python·算法·机器学习·数据挖掘
一名技术极客6 小时前
Python 数据分析 - Matplotlib 绘图
python·数据分析·matplotlib
西农小陈7 小时前
Python-基于PyQt5,json和playsound的通用闹钟
开发语言·windows·python·pycharm·pyqt
AIGC大时代7 小时前
学术方向选则与规划DeepSeek、ChatGPT和Kimi对比
论文阅读·人工智能·chatgpt·数据分析·prompt
说私域11 小时前
对顾客行为的数据分析:融入2+1链动模式、AI智能名片与S2B2C商城小程序的新视角
人工智能·小程序·数据分析·开源
灰灰老师14 小时前
数据分析系列--②RapidMiner导入数据和存储过程
机器学习·ai·数据挖掘·数据分析·rapidminer
字节全栈_OYI15 小时前
在Windows中 基于Oracle GoldenGate (OGG)进行MySQL-&gt;MySQL数据库同步配置(超详细)_ogg-15146
数据库·windows·oracle
绒绒毛毛雨17 小时前
大数据挖掘--两个角度理解相似度计算理论
人工智能·数据挖掘