返回首页

使用python简单进行单细胞分析代码

1.绘制小提琴图 import scanpy as sc data=sc.read_10x_mtx(‘./input_data/text’,var_names=’gene_symbols’) #读取文件

sc.pp.filter_cells(data, min_genes=200)#最少200个基因表达,否则去除该细胞 sc.pp.filter_genes(data, min_cells=3)

data.var[‘mt’] = data.var_names.str.startswith(‘MT-‘) sc.pp.calculate_qc_metrics(data, qc_vars=[‘mt’], percent_top=None, log1p=False, inplace=True)

sc.pl.violin(data, [‘n_genes_by_counts’, ‘total_counts’, ‘pct_counts_mt’], jitter=0.4, multi_panel=True)

print(data)

2UMP降维

import scanpy as sc

data=sc.read_10x_mtx(‘./input_data/text’,var_names=’gene_symbols’) #读取文件

sc.pp.filter_cells(data, min_genes=200)#最少200个基因表达,否则去除该细胞 sc.pp.filter_genes(data, min_cells=3)

data.var[‘mt’] = data.var_names.str.startswith(‘MT-‘) #除去线粒体

sc.pp.normalize_total(data, target_sum=1e4) #数据标准化

sc.pp.log1p(data) #数据对数化

sc.pp.highly_variable_genes(data, min_mean=0.0125, max_mean=3, min_disp=0.5)

sc.tl.pca(data, svd_solver=’arpack’)

计算Computing the neighborhood graph

sc.pp.neighbors(data, n_neighbors=10, n_pcs=40) sc.tl.umap(data)

做出来的图跟教程有些差别

sc.pl.umap(data, color=[‘CST3’, ‘NKG7’, ‘PPBP’]) sc.pl.umap(data, color=[‘CST3’, ‘NKG7’, ‘PPBP’], use_raw=False)

Clustering the neighborhood graph。聚类并着色

这里需要安装pip3 install leidenalg

sc.tl.leiden(data) sc.pl.umap(data, color=[‘leiden’, ‘CST3’, ‘NKG7’])

3基因表达调控绘制 import scanpy as sc data=sc.read_10x_mtx(‘./input_data/text’,var_names=’gene_symbols’) #读取文件 sc.pl.highest_expr_genes(data, n_top=20, ) print(data)

4 线粒体基因和个基因占比 import scanpy as sc data=sc.read_10x_mtx(‘./input_data/text’,var_names=’gene_symbols’) #读取文件

sc.pp.filter_cells(data, min_genes=200)#最少200个基因表达,否则去除该细胞 sc.pp.filter_genes(data, min_cells=3)

data.var[‘mt’] = data.var_names.str.startswith(‘MT-‘) sc.pp.calculate_qc_metrics(data, qc_vars=[‘mt’], percent_top=None, log1p=False, inplace=True)

sc.pl.scatter(data, x=’total_counts’, y=’pct_counts_mt’) sc.pl.scatter(data, x=’total_counts’, y=’n_genes_by_counts’)

print(data) 5高峰表达与肘击图 import scanpy as sc

data=sc.read_10x_mtx(‘./input_data/text’,var_names=’gene_symbols’) #读取文件

sc.pp.filter_cells(data, min_genes=200)#最少200个基因表达,否则去除该细胞 sc.pp.filter_genes(data, min_cells=3)

data.var[‘mt’] = data.var_names.str.startswith(‘MT-‘) #除去线粒体

sc.pp.normalize_total(data, target_sum=1e4) #数据标准化

sc.pp.log1p(data) #数据对数化

sc.pp.highly_variable_genes(data, min_mean=0.0125, max_mean=3, min_disp=0.5) sc.pl.highly_variable_genes(data)

sc.tl.pca(data, svd_solver=’arpack’) sc.pl.pca(data, color=’CST3’) sc.pl.pca_variance_ratio(data, log=True)

print(data)

评论

0 条
暂无评论,来发表第一条评论吧