In [1]:
import pandas as pd

# Read the first worksheet of DEG_list.xlsx into a DataFrame. The later R cell
# filters and merges on its `ensembl_gene_id` column.
data = pd.read_excel(io='DEG_list.xlsx')
In [2]:
%get data
# SoS magic: copies the variable `data` into this cell's kernel so that the
# following cell can use it. With no --from option the source is presumably
# the SoS (Python) kernel that ran the read_excel cell -- confirm against the
# notebook's kernel assignments.
In [3]:
library(biomaRt)

# Connect straight to the mouse gene dataset on the Ensembl BioMart. A separate
# dataset-less connection is not needed for the query below; to browse the
# available datasets interactively, run
#   listDatasets(useEnsembl(biomart = "ensembl"))
ensembl <- useEnsembl(biomart = "ensembl", dataset = "mmusculus_gene_ensembl")

# `data` is supplied by the preceding `%get data` cell. Fail early if the key
# column used for both the BioMart filter and the merge is missing.
stopifnot("ensembl_gene_id" %in% names(data))

# getBM() expects the filter values as a vector, so extract the column with
# `[[` (a plain vector) instead of `[` (a one-column data frame), and query
# each distinct, non-missing ID only once.
gene_ids <- unique(as.character(data[["ensembl_gene_id"]]))
gene_ids <- gene_ids[!is.na(gene_ids)]

# Look up the gene name for every Ensembl gene ID.
# NOTE: the variable is called `hgnc`, but the dataset queried is mouse
# (mmusculus_gene_ensembl); the name is kept so other cells that may reference
# it keep working.
hgnc <- getBM(
  attributes = c("ensembl_gene_id", "external_gene_name"),
  filters = "ensembl_gene_id",
  values = gene_ids,
  mart = ensembl
)

# Left join: every row of `data` is kept; IDs with no BioMart match get NA in
# `external_gene_name`.
annotated <- merge(data, hgnc, by = "ensembl_gene_id", all.x = TRUE)
In [4]:
%get annotated --from R
annotated = annotated.set_index('external_gene_name')
annotated.sort_values(by='padj', inplace=True)
annotated.to_excel('annotated_DEG_list.xlsx')