展开

单细胞数据集

最后发布时间 : 2023-01-11 11:54:35 浏览量 :

https://www.ncbi.nlm.nih.gov/geo/query/acc.cgi?acc=GSE60361

library(tidyverse)
library(Seurat)
library(Matrix)

# Load the GSE60361 expression table and build a Seurat object from it.
#
# The values in the `cell_id` column become the row names. Rows repeating a
# `cell_id` value are dropped first (the first occurrence is kept), since
# data-frame row names must be unique.
# NOTE(review): the delimiter is left to readr's auto-detection, as in the
# original; pass `delim = "\t"` explicitly if the file is confirmed to be
# tab-separated.
exprMatrix <- read_delim(
  "testData/singlecell/GSE60361_C1-3005-Expression.txt.gz"
) |>
  distinct(cell_id, .keep_all = TRUE) |>
  column_to_rownames("cell_id")
exprMatrix[1:5, 1:5]
# Base R equivalent of column_to_rownames() for a data frame `df` whose first
# column holds the identifiers:
# rownames(df) <- df[, 1]
# df <- df[, -1]

# Convert the data frame to a dense matrix, then to a sparse one, before
# handing it to Seurat as the counts matrix.
Matx <- as.matrix(exprMatrix)
Matx <- as(Matx, "sparseMatrix")
seurat_ob <- CreateSeuratObject(counts = Matx)
# Preview the stored counts through the accessor instead of reaching into
# S4 slots: `seurat_ob@assays$RNA@counts` only works with the Seurat v4
# `Assay` class and fails on v5 `Assay5` objects. `slot = "counts"` is
# accepted by both major versions (v5 reports it as deprecated in favour of
# `layer`).
GetAssayData(seurat_ob, assay = "RNA", slot = "counts")[1:5, 1:5]

monocle lung 数据

原始位置: monocle-release/R/utils.R、monocle-release/inst/extdata/
测试数据: https://gitee.com/bioinfoFungi/monocle2/tree/master/monocle2_lung

表达矩阵

# Download the monocle2 lung expression table, then move its `symbol` column
# into the row names so the remaining columns are the per-sample values.
lung_exprs_data <- readr::read_tsv(
  file = "https://gitee.com/bioinfoFungi/monocle2/raw/master/monocle2_lung/lung_exprs_data.tsv",
  show_col_types = FALSE
)
lung_exprs_data <- column_to_rownames(lung_exprs_data, var = "symbol")
# Preview the top-left 5 x 5 corner.
lung_exprs_data[seq_len(5), seq_len(5)]
#                     SRR1033854_0       SRR1033855_0        SRR1033856_0         SRR1033859_0       SRR1033860_0
ENSMUSG00000000031.9  0                  0                   0                    10.7100207665015   0
ENSMUSG00000000058.6  34.6354356143998   0                   0                    28.214174057558    3.18299366520609
ENSMUSG00000000184.9  0.118705574924682  0.0267344012991981  0.00979288708446397  0                  0.653084159748841
ENSMUSG00000000216.8  0.442115291788066  0.0880425887744926  0.116616298212331    0.117774740716152  12.2427903522189
ENSMUSG00000000402.2  43.4605452125962   43.8824386088398    3.33280333643549     0.877212657158511  0

样本信息

# Download the monocle2 lung sample sheet, then move its `sample` column into
# the row names.
lung_phenotype_data <- readr::read_tsv(
  file = "https://gitee.com/bioinfoFungi/monocle2/raw/master/monocle2_lung/lung_phenotype_data.tsv",
  show_col_types = FALSE
)
lung_phenotype_data <- column_to_rownames(lung_phenotype_data, var = "sample")
# Preview the top-left 5 x 5 corner.
lung_phenotype_data[seq_len(5), seq_len(5)]
#             file                                              total_mass  internal_scale  external_scale  median_transcript_frags
SRR1033854_0  ./quantification/SRR1033854_clout/abundances.cxb  2840200     2.16877         1               0.363568
SRR1033855_0  ./quantification/SRR1033855_clout/abundances.cxb  2968830     4.20782         1               0.00141841
SRR1033856_0  ./quantification/SRR1033856_clout/abundances.cxb  3396210     6.17393         1               0.403053
SRR1033859_0  ./quantification/SRR1033859_clout/abundances.cxb  2846020     5.62105         1               0.0318467
SRR1033860_0  ./quantification/SRR1033860_clout/abundances.cxb  3636420     11.0584         1               0.00151798

基因信息

# Download the monocle2 lung gene annotation table, then move its `symbol`
# column into the row names.
lung_feature_data <- readr::read_tsv(
  file = "https://gitee.com/bioinfoFungi/monocle2/raw/master/monocle2_lung/lung_feature_data.tsv",
  show_col_types = FALSE
)
lung_feature_data <- column_to_rownames(lung_feature_data, var = "symbol")
# Preview the top-left 5 x 5 corner.
lung_feature_data[seq_len(5), seq_len(5)]
#                     class_code  nearest_ref_id  gene_id               gene_short_name  tss_id
ENSMUSG00000000031.9  -           -               ENSMUSG00000000031.9  H19              -
ENSMUSG00000000058.6  -           -               ENSMUSG00000000058.6  Cav2             -
ENSMUSG00000000184.9  -           -               ENSMUSG00000000184.9  Ccnd2            -
ENSMUSG00000000216.8  -           -               ENSMUSG00000000216.8  Scnn1g           -
ENSMUSG00000000402.2  -           -               ENSMUSG00000000402.2  Egfl6            -

monocle HSMM(human skeletal muscle myoblasts) 数据

原始位置:monocle-release/tests/testthat/test.plot_cell_clusters.R
数据说明:Single-cell RNA-Seq for differentiating human skeletal muscle myoblasts (HSMM)

library(HSMMSingleCell)
# Load the three HSMM example datasets (expression matrix, gene annotation,
# sample sheet) in a single data() call.
data(list = c(
  "HSMM_expr_matrix",
  "HSMM_gene_annotation",
  "HSMM_sample_sheet"
))