{"doi":"10.1007/s00335-015-9571-1","title":"A unified gene catalog for the laboratory mouse reference genome","abstract":null,"journal":"Mammalian Genome","year":2015,"id":16675,"datarank":0.6906986179699603,"base_score":3.091042453358316,"endowment":3.091042453358316,"self_citation_contribution":0.4636563680037475,"citation_network_contribution":0.2270422499662128,"self_endowment_contribution":0.4636563680037475,"citer_contribution":0.2270422499662128,"corpus_percentile":54.5,"corpus_rank":593,"citation_count":21,"citer_count":9,"citers_with_citation_signal":6,"citers_with_endowment":6,"datacite_reuse_total":0,"is_dataset":true,"is_dataset_confidence":null,"is_oa":false,"file_count":0,"downloads":0,"has_version_chain":false,"published_date":null,"fair_score":54.1667,"fair_percentile":80.05716798592788,"algorithm_id":"datarank_citation_only_1hop_v6","ranking_scope":"data_only","authors":[{"id":122231,"name":"J. E. Richardson","orcid":null,"position":1,"is_corresponding":false},{"id":122232,"name":"P. Hale","orcid":null,"position":2,"is_corresponding":false},{"id":122233,"name":"R. M. Baldarelli","orcid":null,"position":3,"is_corresponding":false},{"id":122234,"name":"D. J. Reed","orcid":null,"position":4,"is_corresponding":false},{"id":122235,"name":"J. M. Recla","orcid":null,"position":5,"is_corresponding":false},{"id":122236,"name":"R. Sinclair","orcid":null,"position":6,"is_corresponding":false},{"id":32463,"name":"T. B. K. Reddy","orcid":"0000-0002-0871-5567","position":7,"is_corresponding":false},{"id":122237,"name":"C. J. Bult","orcid":null,"position":8,"is_corresponding":false},{"id":10795,"name":"Y. Zhu","orcid":"0000-0001-7964-0091","position":0,"is_corresponding":false}],"reference_count":0,"raw_metadata":{"has_enrichment":true,"base_score":3.091042453358316,"endowment":3.091042453358316,"datacite_reuse_total":0,"file_count":0,"downloads":0,"views":0,"has_version_chain":false,"is_dataset":false,"is_oa":false,"pmid":"26084703","pmcid":"PMC4534496","openalex_id":"https://openalex.org/W1814949048","authors":[],"funders":[{"funder_name":"NCI NIH HHS","grant_id":"P30 CA034196","title":null},{"funder_name":"NHGRI NIH HHS","grant_id":"HG00330-P1","title":null},{"funder_name":"NHGRI NIH HHS","grant_id":"P41 HG000330","title":null},{"funder_name":"NHGRI NIH HHS","grant_id":"U41 HG000330","title":null}],"total_grants":4,"fwci":1.66,"citation_percentile":0.83318592,"influential_citations":0,"citation_trend":[{"year":2015,"count":2},{"year":2016,"count":6},{"year":2017,"count":1},{"year":2018,"count":2},{"year":2019,"count":2},{"year":2020,"count":2},{"year":2021,"count":4},{"year":2024,"count":1}],"oa_status":"hybrid","license":"cc-by","oa_locations":[{"url":"https://link.springer.com/content/pdf/10.1007/s00335-015-9571-1.pdf","host_type":"journal"},{"url":"https://link.springer.com/content/pdf/10.1007/s00335-015-9571-1.pdf","host_type":"HYBRID"},{"url":"https://link.springer.com/content/pdf/10.1007/s00335-015-9571-1.pdf","host_type":"publisher"},{"url":"http://link.springer.com/article/10.1007/s00335-015-9571-1/fulltext.html","host_type":"publisher"},{"url":"http://link.springer.com/content/pdf/10.1007/s00335-015-9571-1.pdf","host_type":"publisher"},{"url":"http://link.springer.com/content/pdf/10.1007/s00335-015-9571-1","host_type":"publisher"},{"url":"https://doi.org/10.1007/s00335-015-9571-1","host_type":"journal"},{"url":"https://pubmed.ncbi.nlm.nih.gov/26084703","host_type":"repository"},{"url":"https://www.ncbi.nlm.nih.gov/pmc/articles/4534496","host_type":"repository"},{"url":"https://mouseion.jax.org/stfb2015/140","host_type":"repository"},{"url":"https://europepmc.org/articles/PMC4534496","host_type":"Europe_PMC"},{"url":"https://europepmc.org/articles/PMC4534496?pdf=render","host_type":"Europe_PMC"}],"fields_of_study":["Genomics and Phylogenetic Studies","Gene expression and cancer classification","Molecular Biology Techniques and Applications","Medicine","Biology","Computer Science"],"mesh_terms":["Algorithms","Animals","Models, Genetic","Terminology as Topic","Pseudogenes","RNA","Software","Open Reading Frames","Genome","Internet","Genomics","Databases, Genetic","Mice","Molecular Sequence Annotation"],"keywords":["Ensembl","Genome","Annotation","Pseudogene","Gene Annotation","Genome project","Gene nomenclature","Biology","Genome browser","Computational biology","Gene prediction","Gene","Reference genome","Genomics","RefSeq","Genetics"],"sdg_mappings":[],"linked_datasets":[],"clinical_trials":[],"software_tools":[],"database_accessions":[{"name":"ensembl"}],"source":"live","citation_network_status":"fetched"},"created_at":"2026-06-02T12:31:42.963887Z","pmid":"26084703","pmcid":"PMC4534496","fwci":null,"citation_percentile":null,"influential_citations":0,"oa_status":"hybrid","license":"cc-by","views":0,"total_file_size_bytes":0,"version_count":0,"fair_f":65.0,"fair_a":72.5,"fair_i":37.5,"fair_r":41.6667,"fair_zscore":0.8101,"fair_rationale":{"fair_score":54.17,"has_llm":true,"dimensions":{"F":{"name":"Findable","score":65.0,"criteria":[{"key":"f_has_doi","label":"Has a persistent DOI","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"DOI present","rationale":null},{"key":"f_repository_presence","label":"Indexed in repositories / literature DBs","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"datacite=0, pmcid=True, pmid=True","rationale":null},{"key":"f_persistent_ids","label":"Resolvable scholarly identifiers (OpenAlex)","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"no OpenAlex id","rationale":null},{"key":"f_metadata_richness","label":"Rich, machine-readable metadata","kind":"llm","weight":1.0,"fraction":0.5,"signal":null,"rationale":"The paper describes the catalog and its contents but does not provide machine-readable metadata (e.g., structured JSON-LD, schema.org annotations) or a formal metadata record beyond the article itself."}]},"A":{"name":"Accessible","score":72.5,"criteria":[{"key":"a_open_access","label":"Open Access / files deposited","kind":"deterministic","weight":1.5,"fraction":0.5,"signal":"files/OA location present but not flagged OA","rationale":null},{"key":"a_retrievable","label":"Free full text retrievable","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"12 OA location(s)","rationale":null},{"key":"a_access_protocol","label":"Clear data/code access protocol","kind":"llm","weight":1.0,"fraction":0.75,"signal":null,"rationale":"The paper provides clear URLs for accessing the catalog (e.g., MGI database, FTP sites) and the fjoin code, but does not specify a formal access protocol (e.g., API, authentication requirements) or a persistent identifier like a DOI for the data."}]},"I":{"name":"Interoperable","score":37.5,"criteria":[{"key":"i_linked_data","label":"Linked datasets / DataCite relations","kind":"deterministic","weight":1.0,"fraction":0.0,"signal":"linked_datasets=0, datacite=0","rationale":null},{"key":"i_standard_ids","label":"References data via standard accessions","kind":"deterministic","weight":1.0,"fraction":0.0,"signal":"accessions=0, trials=0","rationale":null},{"key":"i_standards","label":"Standard formats, vocabularies & identifiers","kind":"llm","weight":1.0,"fraction":0.75,"signal":null,"rationale":"The paper uses standard formats (GFF3, tab-delimited) and references Sequence Ontology terms, but does not demonstrate use of community-standard identifiers for all features (e.g., no mention of using identifiers.org or equivalent resolvable IDs)."}]},"R":{"name":"Reusable","score":41.67,"criteria":[{"key":"r_license","label":"Clear, open reuse license","kind":"deterministic","weight":1.5,"fraction":0.0,"signal":"no license","rationale":null},{"key":"r_downloads","label":"Demonstrated reuse (downloads)","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"downloads=0","rationale":null},{"key":"r_version","label":"Versioned / maintained","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"no version chain","rationale":null},{"key":"r_dataset","label":"Classified as a data resource","kind":"deterministic","weight":0.5,"fraction":1.0,"signal":"is_dataset","rationale":null},{"key":"r_reusability","label":"Data-availability statement, license & reproducibility","kind":"llm","weight":2.0,"fraction":0.667,"signal":null,"rationale":"The paper includes a data-availability statement with download links and a CC BY license, but lacks explicit reproducibility details (e.g., exact software versions, parameter files) and does not provide a formal data citation or persistent identifier for the catalog version."}]}},"suggestions":["Add machine-readable metadata (e.g., JSON-LD with schema.org/Dataset) to the paper and data repository to improve findability.","Assign a persistent identifier (e.g., DOI) to each version of the unified gene catalog and include it in the paper.","Provide a formal API or SPARQL endpoint for programmatic access to the catalog, with documentation.","Use resolvable identifiers (e.g., identifiers.org URIs) for all genome features and biotypes to enhance interoperability.","Include a reproducibility package with exact software versions, configuration files, and input data versions in a public repository."],"model":"deepseek/deepseek-v4-flash","agent_version":"fair_agent_v2","fulltext_source":"epmc_xml"},"fair_model":"deepseek/deepseek-v4-flash","fair_agent_version":"fair_agent_v2","fair_fulltext_source":"epmc_xml","fair_has_llm":true,"fair_computed_at":"2026-06-18T00:47:23.714523Z","clinical_trials":[],"software_tools":[],"db_accessions":[],"linked_datasets":[],"topics":[]}