Last updated: 2019-01-01

Data loading and inspection of the metadata.

                      nGene    nUMI    orig.ident                  cell
A12.D041914.3_8_M.1.1  4712 1221663 SeuratProject A12.D041914.3_8_M.1.1
B16.D041914.3_8_M.1.1  3652 1837897 SeuratProject B16.D041914.3_8_M.1.1
C18.D041914.3_8_M.1.1  6220 1703523 SeuratProject C18.D041914.3_8_M.1.1
D22.D041914.3_8_M.1.1  5322  949162 SeuratProject D22.D041914.3_8_M.1.1
F4.D041914.3_8_M.1.1   3036   59975 SeuratProject  F4.D041914.3_8_M.1.1
C19.D041914.3_8_M.1.1  5350  808935 SeuratProject C19.D041914.3_8_M.1.1
                       tissue cell_ontology_class cell_ontology_id
A12.D041914.3_8_M.1.1 Bladder    mesenchymal cell       CL:0008019
B16.D041914.3_8_M.1.1 Bladder        bladder cell       CL:1001319
C18.D041914.3_8_M.1.1 Bladder        bladder cell       CL:1001319
D22.D041914.3_8_M.1.1 Bladder        bladder cell       CL:1001319
F4.D041914.3_8_M.1.1  Bladder    mesenchymal cell       CL:0008019
C19.D041914.3_8_M.1.1 Bladder        bladder cell       CL:1001319
A12.D041914.3_8_M.1.1 Bladder_mesenchymal cell
B16.D041914.3_8_M.1.1     Bladder_bladder cell
C18.D041914.3_8_M.1.1     Bladder_bladder cell
D22.D041914.3_8_M.1.1     Bladder_bladder cell
F4.D041914.3_8_M.1.1  Bladder_mesenchymal cell
C19.D041914.3_8_M.1.1     Bladder_bladder cell
# Convert the maca Seurat object and the saved 10x Seurat object into
# SingleCellExperiment objects, which is what the scmap calls below operate on.
sce_maca <- as.SingleCellExperiment(seurat_obj)
all10x <- readRDS('output/10x-180504')
sce_10x <- as.SingleCellExperiment(all10x)

# Convert maca gene names to uppercase to match 10x gene names.
# toupper() is vectorised, so it is applied to the whole column at once
# instead of element by element through lapply()/unlist().
rowData(sce_maca)['feature_symbol'] <- toupper(rowData(sce_maca)$gene)
rowData(sce_10x)['feature_symbol'] <- rowData(sce_10x)$gene

# Store the count and log-count assays of both objects as base matrices.
counts(sce_10x) <- as.matrix(counts(sce_10x))
logcounts(sce_10x) <- as.matrix(logcounts(sce_10x))

counts(sce_maca) <- as.matrix(counts(sce_maca))
logcounts(sce_maca) <- as.matrix(logcounts(sce_maca))

# Feature selection on the full maca reference; the diagnostic plot is shown.
sce_maca <- selectFeatures(sce_maca, suppress_plot = FALSE)

Cell types in the fat dataset %>% filter(tissue=="Fat") %>% distinct(tissue_cell_type)
1                      Fat_myeloid cell
2                            Fat_T cell
3                            Fat_B cell
4                       Fat_granulocyte
5  Fat_mesenchymal stem cell of adipose
6                  Fat_endothelial cell
7               Fat_natural killer cell
8                   Fat_epithelial cell
9                        Fat_neutrophil
10               Fat_smooth muscle cell

Subsetting and preparing the data.

# Keep only the cells whose 'tissue' identity is "Fat".
maca_fat <- SubsetData(SetAllIdent(seurat_obj, id='tissue'), ident.use="Fat")
sce_maca_fat <- as.SingleCellExperiment(maca_fat)

# Uppercase gene names for the fat subset; toupper() is vectorised, so the
# per-element lapply()/unlist() round trip is unnecessary.
rowData(sce_maca_fat)['feature_symbol'] <- toupper(rowData(sce_maca_fat)$gene)

# Store the count and log-count assays as base matrices.
counts(sce_maca_fat) <- as.matrix(counts(sce_maca_fat))
logcounts(sce_maca_fat) <- as.matrix(logcounts(sce_maca_fat))

# Feature selection on the fat-only reference; the diagnostic plot is shown.
sce_maca_fat <- selectFeatures(sce_maca_fat, suppress_plot = FALSE)

Setting the right column for clustering.

# Build the cluster index for the fat reference, grouping cells by the
# 'cell_ontology_class' column.
sce_maca_fat <- indexCluster(
  sce_maca_fat,
  cluster_col = 'cell_ontology_class'
)

Predicting cell types in our dataset.

# Project the 10x cells onto the cluster index of the fat reference.
# The index list is named, and that name ('sce_maca_fat') is later used to
# select the matching column of the returned label matrix.
scmapCluster_results_fat <- scmapCluster(
  projection = sce_10x,
  index_list = list(
    sce_maca_fat = metadata(sce_maca_fat)$scmap_cluster_index
  ),
  threshold = 0.5  # default=0.7
)
Warning in setFeatures(projection, rownames(index)): Features
1190002H23RIK, 8430408G22RIK, ADH1, AW112010, C1RA, C4B, CAR4, CCL6,
CCL9, CCR2, CD2, CD24A, CD48, CD53, CXCR7, CYB5, CYBB, CYP4B1, CYP4F18,
ERCC-00009, ERCC-00108, F13A1, FCGR2B, FCGR3, GIMAP3, GIMAP6, GM11428,
GPIHBP1, H2-AA, H2-AB1, H2-D1, H2-DMA, H2-DMB1, H2-DMB2, H2-EB1, H2-K1, H2-
OB, H2-Q6, HMGCS2, IFI205, IFI27L2A, IL11RA1, LILRB4, LRRC33, LY6A, LY6C1,
LY86, LYZ2, MGL2, MMP23, MRC1, MS4A1, MS4A4B, MS4A4C, MS4A4D, MS4A6B,
TPRGL, TRF are not present in the 'SCESet' object and therefore were not

Number of predictions for each annotation for the whole dataset and for the mixture cluster.

# NOTE(review): the text between `<-` and `$scmap_cluster_labs` was missing in
# the source for both tallies. as.data.frame(table(...)) on the scmapCluster
# result is reconstructed from the trailing `))` and the `Var1`/`Freq` columns
# used below -- confirm against the original notebook.

# Number of predictions per label over all cells, most frequent first.
pred_fat <- as.data.frame(table(scmapCluster_results_fat$scmap_cluster_labs))
pred_fat <- pred_fat[order(-pred_fat$Freq),]

# Same tally, restricted to the cells whose res.0.5 value is 12.
pred_mixt_fat <- as.data.frame(table(
  scmapCluster_results_fat$scmap_cluster_labs[which(colData(sce_10x)$res.0.5 %in% 12), 'sce_maca_fat']
))

# Join both tallies on the label. merge() keeps only labels present in both
# tables by default, and the suffixes distinguish the two Freq columns.
scmap_nr_predictions <- merge(pred_fat, pred_mixt_fat, by='Var1', suffixes=c('.total', '.mixture'))
                              Var1 Freq.total Freq.mixture
1                  epithelial cell        861          723
2 mesenchymal stem cell of adipose      43909           78
3               smooth muscle cell        749           18
4                       unassigned      10852          320

Interestingly, the mixture cluster contains many epithelial cell predictions and comparatively few mesenchymal stem cell predictions.

# NOTE(review): the right-hand side of the next assignment is missing from the
# source, so it runs on into the `names<-` line below. Presumably it built a
# one-column data frame of the scmap labels keyed by cell name -- restore it
# from the original notebook before running.
predicted_labels_fat <-
names(predicted_labels_fat) <- 'predicted_labels_fat'
# Attach the labels to the Seurat object under 'predicted_labels_fat'.
all10x <- AddMetaData(all10x, metadata=predicted_labels_fat,'predicted_labels_fat')
# Keep the tSNE plot in t1 so it can be saved below.
# NOTE(review): presumably coloured by the new metadata column -- confirm how
# the second positional argument binds in the installed Seurat version.
t1 <- TSNEPlot(all10x,'predicted_labels_fat', pt.size=0.1)

# Write the tSNE plot held in t1 to the slides folder as a PDF.
save_plot("/projects/pytrik/sc_adipose/analyze_10x_fluidigm/data/plots_slides/scmap.pdf", t1, base_width=8, base_height = 5)

# Labelled tSNE plot for 'sample_name'. TRUE is spelled out because T is an
# ordinary variable that can be reassigned.
TSNEPlot(all10x,'sample_name', pt.size=0.1, do.label=TRUE)

#saveRDS(all10x, 'output/10x-180504')
# Persist the per-label prediction counts as a plain-text table.
write.table(scmap_nr_predictions, file = 'tables/10x-180504-scmap-numbers')

