Skip to content

Commit

Permalink
added missing Entrez identifiers
Browse files: browse the repository at this point in the history
  • Loading branch information
sigven committed Aug 29, 2024
1 parent 3b24a9f commit 19d6cde
Show file tree
Hide file tree
Showing 3 changed files with 24 additions and 5 deletions.
7 changes: 4 additions & 3 deletions NEWS.md
Original file line number Diff line number Diff line change
@@ -1,7 +1,8 @@
# Version 0.9.5
# Version 0.9.6

- fix bug in Entrez gene identifiers (grch37)
- fix bug in HGNC id map (grch38)
- fixed bug in Entrez gene identifiers (grch37)
- fixed bug in HGNC id map (grch38)
- added missing Entrez gene identifiers (grch37/grch38)

# Version 0.9.2

Expand Down
Binary file modified R/sysdata.rda
Binary file not shown.
22 changes: 20 additions & 2 deletions data-raw/utils_gencode_annotation.R
Original file line number Diff line number Diff line change
Expand Up @@ -1157,9 +1157,27 @@ biomart_ensg2entrez <- function(build = "grch37",
"entrezgene" = "entrezgene")) |>
dplyr::anti_join(mappings_in_gene_info, by = "ensembl_gene_id")

return(dplyr::bind_rows(
tmp_mappings <- dplyr::bind_rows(
mappings_in_gene_info,
other_mappings))
other_mappings)

other_mappings2 <- gene_info |>
dplyr::mutate(entrezgene = as.character(entrezgene)) |>
dplyr::select(hgnc_id, ensembl_gene_id, name, entrezgene) |>
dplyr::rename(description = name) |>
dplyr::anti_join(tmp_mappings,
by = c("entrezgene" = "entrezgene")) |>
dplyr::filter(!is.na(ensembl_gene_id))

tmp_mappings <- tmp_mappings |>
dplyr::anti_join(
dplyr::select(other_mappings2, ensembl_gene_id),
by = "ensembl_gene_id")


return(dplyr::bind_rows(
tmp_mappings,
other_mappings2))

}

Expand Down

0 comments on commit 19d6cde

Please sign in to comment.