{"doi":"10.1093/nar/gkr1178","title":"The NCBI Taxonomy database","abstract":"The NCBI Taxonomy database (http://www.ncbi.nlm.nih.gov/taxonomy) is the standard nomenclature and classification repository for the International Nucleotide Sequence Database Collaboration (INSDC), comprising the GenBank, ENA (EMBL) and DDBJ databases. It includes organism names and taxonomic lineages for each of the sequences represented in the INSDC's nucleotide and protein sequence databases. The taxonomy database is manually curated by a small group of scientists at the NCBI who use the current taxonomic literature to maintain a phylogenetic taxonomy for the source organisms represented in the sequence databases. The taxonomy database is a central organizing hub for many of the resources at the NCBI, and provides a means for clustering elements within other domains of NCBI web site, for internal linking between domains of the Entrez system and for linking out to taxon-specific external resources on the web. Our primary purpose is to index the domain of sequences as conveniently as possible for our user community.","journal":"Nucleic Acids Research","year":2011,"id":553,"datarank":25.453086410679823,"base_score":7.302496423727326,"endowment":7.302496423727326,"self_citation_contribution":1.095374463559099,"citation_network_contribution":24.357711947120723,"self_endowment_contribution":1.095374463559099,"citer_contribution":24.357711947120723,"corpus_percentile":98.53539462978031,"corpus_rank":19,"citation_count":1541,"citer_count":199,"citers_with_citation_signal":199,"citers_with_endowment":199,"datacite_reuse_total":0,"is_dataset":true,"is_dataset_confidence":0.9445,"is_oa":true,"file_count":0,"downloads":0,"has_version_chain":false,"published_date":"2011-12-01","fair_score":84.1667,"fair_percentile":99.7,"algorithm_id":"datarank_citation_only_1hop_v6","ranking_scope":"data_only","authors":[{"id":5656,"name":"Scott Federhen","orcid":null,"position":1,"is_corresponding":false},{"id":5655,"name":"S. Federhen","orcid":null,"position":0,"is_corresponding":true}],"reference_count":8,"raw_metadata":{"citation_network_status":"fetched"},"created_at":"2026-03-01T18:20:47.508186Z","pmid":"22139910","pmcid":"PMC3245000","fwci":null,"citation_percentile":null,"influential_citations":0,"oa_status":"gold","license":"cc-by-nc","views":0,"total_file_size_bytes":0,"version_count":0,"fair_f":100.0,"fair_a":70.0,"fair_i":100.0,"fair_r":66.6667,"fair_zscore":-0.2,"fair_rationale":{"fair_score":84.17,"has_llm":false,"dimensions":{"F":{"name":"Findable","score":100.0,"criteria":[{"key":"f_has_doi","label":"Has a persistent DOI","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"DOI present","rationale":null},{"key":"f_repository_presence","label":"Indexed in repositories / literature DBs","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"datacite=25, pmcid=True, pmid=True","rationale":null},{"key":"f_persistent_ids","label":"Resolvable scholarly identifiers (OpenAlex)","kind":"deterministic","weight":0.5,"fraction":1.0,"signal":"OpenAlex id present","rationale":null}]},"A":{"name":"Accessible","score":70.0,"criteria":[{"key":"a_open_access","label":"Open Access / files deposited","kind":"deterministic","weight":1.5,"fraction":0.5,"signal":"files/OA location present but not flagged OA","rationale":null},{"key":"a_retrievable","label":"Free full text retrievable","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"9 OA location(s)","rationale":null}]},"I":{"name":"Interoperable","score":100.0,"criteria":[{"key":"i_linked_data","label":"Linked datasets / DataCite relations","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"linked_datasets=25, datacite=25","rationale":null},{"key":"i_standard_ids","label":"References data via standard accessions","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"accessions=1, trials=0","rationale":null}]},"R":{"name":"Reusable","score":66.67,"criteria":[{"key":"r_license","label":"Clear, open reuse license","kind":"deterministic","weight":1.5,"fraction":1.0,"signal":"open license (cc-by-nc)","rationale":null},{"key":"r_downloads","label":"Demonstrated reuse (downloads)","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"downloads=0","rationale":null},{"key":"r_version","label":"Versioned / maintained","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"no version chain","rationale":null},{"key":"r_dataset","label":"Classified as a data resource","kind":"deterministic","weight":0.5,"fraction":1.0,"signal":"is_dataset","rationale":null}]}},"suggestions":["Maintain explicit versioning for the dataset.","Make the paper/data Open Access or deposit the files in an open repository."],"model":null,"agent_version":"fair_agent_v3","fulltext_source":"epmc_xml"},"fair_model":null,"fair_agent_version":"fair_agent_v3","fair_fulltext_source":"epmc_xml","fair_has_llm":false,"fair_computed_at":"2026-06-28T13:29:01.367410Z","clinical_trials":[],"software_tools":[],"db_accessions":[],"linked_datasets":[],"topics":[]}