Dear all.
I have perform differential expression analysis using Deseq2 and tximport from rsem data.
When I try to map gene symbol I have some symbol are not annotated. This is some informtion on my code and my version of tools.
library( "biomaRt" ) #ensembl = useMart( "ensembl", dataset = "hsapiens_gene_ensembl" ) ensembl = useMart( host="dec2013.archive.ensembl.org",biomart="ENSEMBL_MART_ENSEMBL", dataset = "hsapiens_gene_ensembl" ) genemap <- getBM( attributes = c("ensembl_gene_id", "entrezgene", "hgnc_symbol","band","chromosome_name"), filters = "ensembl_gene_id", values = list(res$ensembl,"protein_coding"), mart = ensembl ) idx <- match( res$ensembl, genemap$ensembl_gene_id ) res$entrez <- genemap$entrezgene[ idx ] res$hgnc_symbol <- genemap$hgnc_symbol[ idx ] table(res$hgnc_symbol=="HDGFRP2") FALSE 57905 > table(res$hgnc_symbol=="FUS") FALSE TRUE 57904 1 > table(res$hgnc_symbol=="DDIT3") FALSE TRUE 57904 1 > table(res$ensembl=="ENSG00000167674") FALSE TRUE 57904 1 > table(res$ensembl=="ENSG00000167674") FALSE TRUE 57904 1 > sessionInfo() R version 3.3.2 (2016-10-31) Platform: x86_64-pc-linux-gnu (64-bit) Running under: Ubuntu 16.04.2 LTS locale: [1] LC_CTYPE=en_US.UTF-8 LC_NUMERIC=C LC_TIME=it_IT.UTF-8 [4] LC_COLLATE=en_US.UTF-8 LC_MONETARY=it_IT.UTF-8 LC_MESSAGES=en_US.UTF-8 [7] LC_PAPER=it_IT.UTF-8 LC_NAME=C LC_ADDRESS=C [10] LC_TELEPHONE=C LC_MEASUREMENT=it_IT.UTF-8 LC_IDENTIFICATION=C attached base packages: [1] parallel stats4 stats graphics grDevices utils datasets methods base other attached packages: [1] biomaRt_2.28.0 ggplot2_2.2.1 genefilter_1.54.2 [4] pheatmap_1.0.8 tximportData_1.0.2 tximport_1.0.3 [7] DESeq2_1.12.4 SummarizedExperiment_1.2.3 Biobase_2.32.0 [10] GenomicRanges_1.24.3 GenomeInfoDb_1.8.7 IRanges_2.6.1 [13] S4Vectors_0.10.3 BiocGenerics_0.18.0 loaded via a namespace (and not attached): [1] locfit_1.5-9.1 splines_3.3.2 lattice_0.20-35 colorspace_1.3-2 [5] htmltools_0.3.5 base64enc_0.1-3 survival_2.40-1 XML_3.98-1.5 [9] foreign_0.8-67 DBI_0.6-1 BiocParallel_1.6.6 RColorBrewer_1.1-2 [13] plyr_1.8.4 stringr_1.2.0 zlibbioc_1.18.0 munsell_0.4.3 [17] gtable_0.2.0 htmlwidgets_0.8 memoise_1.0.0 labeling_0.3 [21] latticeExtra_0.6-28 knitr_1.15.1 geneplotter_1.50.0 AnnotationDbi_1.34.4 [25] htmlTable_1.9 Rcpp_0.12.9 acepack_1.4.1 xtable_1.8-2 [29] backports_1.0.5 scales_0.4.1 checkmate_1.8.2 Hmisc_4.0-2 [33] annotate_1.50.1 XVector_0.12.1 gridExtra_2.2.1 digest_0.6.12 [37] stringi_1.1.2 grid_3.3.2 tools_3.3.2 bitops_1.0-6 [41] magrittr_1.5 lazyeval_0.2.0 RCurl_1.95-4.8 tibble_1.2 [45] RSQLite_1.1-2 Formula_1.2-1 cluster_2.0.6 Matrix_1.2-8 [49] data.table_1.10.0 assertthat_0.1 rpart_4.1-10 nnet_7.3-12