{"doi":"10.1038/s41597-026-06742-1","title":"Human gut archaea collection from Estonian population","abstract":"While microbiota plays a crucial role in maintaining overall health, archaea, a component of microbiota, remain relatively unexplored. Here, we present a newly assembled set of archaeal metagenome-assembled genomes (MAGs) from 1,878 fecal microbiome samples. These MAGs were reconstructed from metagenomic reads of the Estonian Microbiome Deep (EstMB-deep) cohort, which were reused here specifically for archaeal MAG reconstruction. We identified 273 archaeal MAGs, representing 21 species and 144 strains which we curated into the \"EstMB MAGdb Archaea-273\" MAGs collection.","journal":"Scientific Data","year":2026,"id":8082,"datarank":0.0,"base_score":0.0,"endowment":0.0,"self_citation_contribution":0.0,"citation_network_contribution":0.0,"self_endowment_contribution":0.0,"citer_contribution":0.0,"corpus_percentile":0.0,"corpus_rank":765,"citation_count":0,"citer_count":0,"citers_with_citation_signal":0,"citers_with_endowment":0,"datacite_reuse_total":0,"is_dataset":true,"is_dataset_confidence":0.8796,"is_oa":true,"file_count":0,"downloads":0,"has_version_chain":false,"published_date":"2026-02-06","fair_score":59.1667,"fair_percentile":92.10642040457344,"algorithm_id":"datarank_citation_only_1hop_v6","ranking_scope":"data_only","authors":[{"id":71984,"name":"Elin Org","orcid":null,"position":1,"is_corresponding":false},{"id":71985,"name":"Org Elin","orcid":null,"position":2,"is_corresponding":false},{"id":71983,"name":"Kateryna Pantiukh","orcid":"0000-0002-2595-0673","position":0,"is_corresponding":true}],"reference_count":33,"raw_metadata":{"citation_network_status":"fetched"},"created_at":"2026-03-01T18:20:47.508186Z","pmid":"41651883","pmcid":"PMC12988187","fwci":null,"citation_percentile":null,"influential_citations":0,"oa_status":null,"license":null,"views":0,"total_file_size_bytes":0,"version_count":0,"fair_f":77.5,"fair_a":80.0,"fair_i":37.5,"fair_r":41.6667,"fair_zscore":1.2623,"fair_rationale":{"fair_score":59.17,"has_llm":true,"dimensions":{"F":{"name":"Findable","score":77.5,"criteria":[{"key":"f_has_doi","label":"Has a persistent DOI","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"DOI present","rationale":null},{"key":"f_repository_presence","label":"Indexed in repositories / literature DBs","kind":"deterministic","weight":1.0,"fraction":1.0,"signal":"datacite=0, pmcid=True, pmid=True","rationale":null},{"key":"f_persistent_ids","label":"Resolvable scholarly identifiers (OpenAlex)","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"no OpenAlex id","rationale":null},{"key":"f_metadata_richness","label":"Rich, machine-readable metadata","kind":"llm","weight":1.0,"fraction":0.75,"signal":null,"rationale":"FASTA and XLSX tabular metadata files are provided on Figshare, but the description does not confirm machine-readability beyond basic formats."}]},"A":{"name":"Accessible","score":80.0,"criteria":[{"key":"a_open_access","label":"Open Access / files deposited","kind":"deterministic","weight":1.5,"fraction":1.0,"signal":"Open Access","rationale":null},{"key":"a_retrievable","label":"Free full text retrievable","kind":"deterministic","weight":1.0,"fraction":0.0,"signal":"0 OA location(s)","rationale":null},{"key":"a_access_protocol","label":"Clear data/code access protocol","kind":"llm","weight":1.0,"fraction":1.0,"signal":null,"rationale":"MAGs are deposited in ENA (PRJEB81541) without access restrictions, and descriptive metadata are on Figshare, with public, persistent access via HTTPS."}]},"I":{"name":"Interoperable","score":37.5,"criteria":[{"key":"i_linked_data","label":"Linked datasets / DataCite relations","kind":"deterministic","weight":1.0,"fraction":0.0,"signal":"linked_datasets=0, datacite=0","rationale":null},{"key":"i_standard_ids","label":"References data via standard accessions","kind":"deterministic","weight":1.0,"fraction":0.0,"signal":"accessions=0, trials=0","rationale":null},{"key":"i_standards","label":"Standard formats, vocabularies & identifiers","kind":"llm","weight":1.0,"fraction":0.75,"signal":null,"rationale":"Standard file formats (FASTA, XLSX) and identifiers (ENA, Figshare DOIs) are used, but no explicit use of formal ontologies or community-standard metadata schemas is stated."}]},"R":{"name":"Reusable","score":41.67,"criteria":[{"key":"r_license","label":"Clear, open reuse license","kind":"deterministic","weight":1.5,"fraction":0.0,"signal":"no license","rationale":null},{"key":"r_downloads","label":"Demonstrated reuse (downloads)","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"downloads=0","rationale":null},{"key":"r_version","label":"Versioned / maintained","kind":"deterministic","weight":0.5,"fraction":0.0,"signal":"no version chain","rationale":null},{"key":"r_dataset","label":"Classified as a data resource","kind":"deterministic","weight":0.5,"fraction":1.0,"signal":"is_dataset","rationale":null},{"key":"r_reusability","label":"Data-availability statement, license & reproducibility","kind":"llm","weight":2.0,"fraction":0.667,"signal":null,"rationale":"A data‑availability statement, CC BY‑NC‑ND license, and GitHub code are provided, but the license restricts adaptations and secondary use, limiting full reusability."}]}},"suggestions":["Add JSON-LD, RDF, or XML metadata with community-standard ontology terms to improve machine findability.","Deposit metadata in a repository that supports API access (e.g., Zenodo) to enhance automated retrieval.","Explicitly reference the MIxS (Minimum Information about any (x) Sequence) checklist in the metadata.","Adopt a more permissive license (e.g., CC BY 4.0 or CC0) to enable adaptation and maximize reuse.","Include a README file with formal requirements for reuse, such as required software versions and parameter files."],"model":"deepseek/deepseek-v4-flash","agent_version":"fair_agent_v2","fulltext_source":"epmc_xml"},"fair_model":"deepseek/deepseek-v4-flash","fair_agent_version":"fair_agent_v2","fair_fulltext_source":"epmc_xml","fair_has_llm":true,"fair_computed_at":"2026-06-18T06:48:37.839806Z","clinical_trials":[],"software_tools":[],"db_accessions":[],"linked_datasets":[],"topics":[]}