{"biothing_type":"dataset","build_date":"2026-04-02T12:58:10.229574-07:00","build_version":"20260402","src":{"zenodo":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/zenodo/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"4b20474","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/4b204746768542946ec207bbbf1a91cd1eff2f55/biothings-hub/files/nde-hub/hub/dataload/sources/zenodo/uploader.py"},"stats":{"zenodo":4446684},"download_date":"2025-10-05T18:04:35.629000","version":"2025-10-05T17:58:19Z","upload_date":"2025-04-14T21:37:08.404000","sourceInfo":{"name":"Zenodo","abstract":"Zenodo is a GREI repository that includes most data types and domains.","description":"The OpenAIRE project, in the vanguard of the open access and open data movements in Europe was commissioned by the EC to support their nascent Open Data policy by providing a catch-all repository for EC funded research. CERN, an OpenAIRE partner and pioneer in open source, open access and open data, provided this capability and Zenodo was launched in May 2013.","schema":{"title":"name","header":"dateModifed, url","description":"description","date":"datePublished","language":"inLanguage.name","subject":"keywords","relatedIdentifier":"topicCategory","xml[DOI]":"doi","xml[resourceTypeGeneral]":"@type","xml[creator][creatorName]":"author.name","xml[creator][affiliation]":"author.affiliation","xml[creator][nameIdentifier]":"author.identifier","xml[rights]":"conditionsOfAccess, license","xml[relatedIdentifier][relationType]":"citedBy","xml[contributor][contributorName]":"funding.funder.name"},"url":"https://zenodo.org/","identifier":"Zenodo","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Quarterly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.296,"avg_required_ratio":0.7893,"required_fields":{"name":1.0,"description":0.9601,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.0959,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0955,"doi":0.9999,"infectiousAgent":0.0,"healthCondition":0.0,"species":0.0,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.6149,"license":0.8588,"sdPublisher":0.5322,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":7.06,"sum_recommended_coverage":6.1,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"binary_required_score":8,"binary_recommended_score":8,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.89,"percent_recommended_fields":0.38,"conditionsOfAccess":"Varied"}}},"reframedb":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/reframedb/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/reframedb/uploader.py"},"stats":{"reframedb":400},"download_date":"2026-03-28T07:00:53.939000","version":"2026-03-28T07:00:53Z","upload_date":"2026-03-07T08:01:00.083000","sourceInfo":{"name":"ReframeDB","abstract":"ReframeDB is a Calibr maintained repository that has a screening set of 12,000 compounds for drug repositioning.","description":"The ReFRAME collection of 12,000 compounds is a best-in-class drug repurposing library containing nearly all small molecules that have reached clinical development or undergone significant preclinical profiling. The purpose of such a screening collection is to enable rapid testing of compounds with demonstrated safety profiles in new indications, such as neglected or rare diseases, where there is less commercial motivation for expensive research and development.","schema":{"assay_id":"identifer","assay_title":"name","title_short":"alternateName","authors":"author","summary":"description","purpose":"description","protocol":"description","readout":"description","detection_method":"description","detection_reagents":"description","components":"description","drug_conc":"description","indication":"healthCondition","assay_type":"measurementTechnique","bibliography":"citation"},"url":"https://reframedb.org/","identifier":"ReframeDB","conditionsOfAccess":"Restricted","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0969,"avg_augmented_required_ratio":0.0006,"avg_recommended_score_ratio":0.0976,"avg_required_ratio":0.6747,"required_fields":{"name":1.0,"description":1.0,"author":0.9947,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0532,"date":0.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.5957,"healthCondition":1.0,"species":0.5745,"variableMeasured":0.0,"citation":0.0532,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.7394,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.05,"sum_recommended_coverage":3.96,"required_augmented_fields_coverage":{"funding":0.01,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.57,"infectiousAgent":0.6,"healthCondition":0.05,"citation":0.05,"topicCategory":0.74},"binary_required_score":7,"binary_recommended_score":6,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.29,"conditionsOfAccess":"Unknown"}}},"bei":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/bei/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f412d64","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f412d643a53caff279b75126ea141a96ef3358c1/biothings-hub/files/nde-hub/hub/dataload/sources/bei/uploader.py"},"stats":{"bei":14392},"download_date":"2026-03-31T22:08:16.820000","version":"2026-03-31T22:08:15Z","upload_date":"2026-03-31T22:08:20.065000"},"hca":{"sourceInfo":{"abstract":"The Human Cell Atlas is a repository that includes multimodal data of cells in the human body.","description":"Thanks to new single cell genomics and spatial imaging technologies developed since the late 2000s and early 2010s, it is now possible to measure gene expression profiles in individual cells. These large scale data can be used with machine learning algorithms to decipher how the cells differ from and interact with their neighbors, and how they form and function in the tissue. This now allows scientists to identify and understand cell types in unprecedented detail, resolution and breadth. The Human Cell Atlas (HCA) is an international group of researchers using a combination of these new technologies to create cellular reference maps with the position, function and characteristics of every cell type in the human body.","identifier":"Human Cell Atlas","name":"Human Cell Atlas","schema":{"entryId":"url, _id","projectTitle":"name","projectDescription":"description","institution":"author.affiliation","laboratory":"author.affiliation","contactName":"author.name","projectRole":"author.role","email":"author.email","publicationTitle":"ncitation.ame","publicationUrl":"citation.url","doi":"citation.doi","supplementaryLinks":"mainEntityOfPage, isBasedOn.codeRepository","accession":"sameAs","accessible":"isAccessibleForFree","effectiveOrgan":"keywords","organ":"keywords","organPart":"keywords","disease":"healthCondition.name","genusSpecies":"species","lastModifiedDate":"dateModified","submissionDate":"datePublished"},"url":"https://www.humancellatlas.org/","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.2853,"avg_required_ratio":0.67,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0,"healthCondition":0.8421,"species":0.9979,"variableMeasured":0.0,"citation":0.9853,"conditionsOfAccess":0.0,"isBasedOn":0.0989,"keywords":1.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.0,"sum_recommended_coverage":5.92,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"binary_required_score":6,"binary_recommended_score":7,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.67,"percent_recommended_fields":0.33,"conditionsOfAccess":"Unknown"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/hca/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/hca/uploader.py"},"stats":{"hca":528},"download_date":"2026-03-28T07:02:18.799000","version":"2026-03-28T07:02:18Z","upload_date":"2026-03-28T07:02:20.081000"},"microbiomedb":{"sourceInfo":{"abstract":"MicrobiomeDB is a NIAID supported repository that includes clinical microbiome data and analysis tools.","description":"MicrobiomeDB was developed as a discovery tool that empowers researchers to fully leverage their experimental metadata to construct queries that interrogate microbiome datasets.","name":"MicrobiomeDB","identifier":"MicrobiomeDB","schema":{"displayName":"name","study_categories":"keywords","type":"keywords","description":"description","institution":"contributor.affiliation","contact":"contributor.name","study_access":"conditionsOfAccess","email":"contributor.email","card_points":"description","card_headline":"doi","summary":"abstract","dataset_id":"identifier","dataset_name":"alternateName","pmids_download":"citation, funding","contacts":"author","DownloadVersion":"distribution","Publications":"citation, funding","AssociatedDatasets":"isPartOf, isRelatedTo","HyperLinks":"url"},"url":"https://microbiomedb.org/mbio/app","conditionsOfAccess":"Open","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.17,"avg_augmented_required_ratio":0.03,"avg_recommended_score_ratio":0.1055,"avg_required_ratio":0.76,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.8182,"date":0.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.8182,"healthCondition":0.8636,"species":0.9545,"variableMeasured":0.0,"citation":0.9545,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":1.0,"license":0.0,"sdPublisher":0.1364,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.82,"sum_recommended_coverage":5.73,"required_augmented_fields_coverage":{"funding":0.27,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.95,"infectiousAgent":0.82,"healthCondition":0.86,"citation":0.95,"topicCategory":0.0},"binary_required_score":7,"binary_recommended_score":7,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.33,"conditionsOfAccess":"Open"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/microbiomedb/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/microbiomedb/uploader.py"},"stats":{"microbiomedb":25},"download_date":"2026-03-28T07:00:05.458000","version":"2026-03-28T07:00:05Z","upload_date":"2026-03-28T07:00:10.086000"},"emdb":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/emdb/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"a451b02","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/a451b02d3521c2dd1adb00661e8de32cdc41da2d/biothings-hub/files/nde-hub/hub/dataload/sources/emdb/uploader.py"},"stats":{"emdb":2881},"download_date":"2026-03-28T16:07:13.153000","version":"2026-03-28T16:07:12Z","upload_date":"2026-03-28T16:07:20.083000","sourceInfo":{"abstract":"Electron Microscopy Data Bank (EMDB) is a generalist repository that includes image data.","description":"The Electron Microscopy Data Bank (EMDB) is a public repository for cryogenic-sample Electron Microscopy (cryoEM) volumes and representative tomograms of macromolecular complexes and subcellular structures. It covers a variety of techniques, including single-particle analysis, helical reconstruction, electron tomography, subtomogram averaging, and electron crystallography (for more information, see the EMDB Policies).","identifier":"Electron Microscopy Data Bank","name":"Electron Microscopy Data Bank (EMDB)","schema":{"natural_source_ncbi_code":"species.identifier","sample.supramolecule_list.supramolecule.natural_source.organism.valueOf_":"species.name","admin.key_dates.deposition":"dateCreated","admin.key_dates.update":"dateModified","admin.grant_support.grant_reference.code":"funding.identifier","admin.grant_support.grant_reference.funding_body":"funding.funder.name","facet_record_count":"collectionSize.minValue"},"url":"https://www.ebi.ac.uk/emdb/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.4798,"avg_required_ratio":0.7498,"total_documents":2875,"required_fields":{"name":1.0,"description":1.0,"author":0.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.7256,"date":0.9962},"recommended_fields":{"dateCreated":0.9962,"dateModified":0.9962,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.5527,"healthCondition":0.0,"species":0.4473,"variableMeasured":1.0,"citation":0.0,"conditionsOfAccess":1.0,"isBasedOn":1.0,"keywords":0.0,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.9962,"topicCategory":1.0,"identifier":0.0,"usageInfo":1.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":6.7218,"sum_recommended_coverage":9.9886,"binary_required_score":7,"binary_recommended_score":11,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.7778,"percent_recommended_fields":0.5238,"conditionsOfAccess":"Open"}}},"omicsdi":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/omicsdi/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/omicsdi/uploader.py"},"stats":{"omicsdi":111007},"download_date":"2026-04-01T17:19:56.217000","version":"2026-04-01T17:19:30Z","url":"https://www.omicsdi.org/search","license_url":"https://www.ebi.ac.uk/licencing","upload_date":"2026-04-01T17:20:00.575000","sourceInfo":{"name":"OmicsDI","abstract":"Omics Discovery Index (OmicsDI) is a generalist repository that is part of ELIXIR infrastructure that includes multi-omics data for most domains.","description":"The Omics Discovery Index (OmicsDI) provides a knowledge discovery framework across heterogeneous omics data (genomics, proteomics, transcriptomics and metabolomics).","schema":{"_id":"identifer","citation":"citation","creator":"author","description":"description","distribution":"distribution","keywords":"keywords","name":"name","sameAs":"sameAs","variableMeasured":"variableMeasured"},"url":"https://www.omicsdi.org/","identifier":"Omics Discovery Index (OmicsDI)","conditionsOfAccess":"Unknown","genre":"Generalist","schedule":"Quarterly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0876,"avg_augmented_required_ratio":0.0219,"avg_recommended_score_ratio":0.0686,"avg_required_ratio":0.6191,"required_fields":{"name":0.9726,"description":0.9945,"author":0.739,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.739,"funding":0.2337,"date":0.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.1005,"healthCondition":0.3809,"species":0.425,"variableMeasured":0.2995,"citation":0.5328,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0082,"license":0.0,"sdPublisher":0.739,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.5421,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":5.68,"sum_recommended_coverage":3.03,"required_augmented_fields_coverage":{"funding":0.2,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.42,"infectiousAgent":0.05,"healthCondition":0.27,"citation":0.53,"topicCategory":0.54},"binary_required_score":7,"binary_recommended_score":8,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.38,"conditionsOfAccess":"Unknown"}}},"immunespace":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/immunespace/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/immunespace/uploader.py"},"stats":{"immunespace":204},"download_date":"2026-03-28T23:00:03.157000","version":"2026-03-28T23:00:02Z","upload_date":"2026-03-28T23:00:10.095000","sourceInfo":{"abstract":"ImmuneSpace is a NIAID supported IID repository that includes immune data.","description":"The Human Immunology Project Consortium (HIPC) program was established in 2010, and renewed in 2015 and in 2022, by the NIAID Division of Allergy, Immunology, and Transplantation as part of the overall NIAID focus on human immunology. Through this program, well-characterized human cohorts are studied using a variety of modern analytic tools, including multiplex transcriptional, cytokine, and proteomic assays; multiparameter phenotyping of leukocyte subsets; assessment of leukocyte functional status; and multiple computational methods.Through the HIPC program, centralized research resources and a comprehensive, centralized database will be constructed for use by the greater scientific community. The information gained from the HIPC program will provide a comprehensive understanding of the human immune system and its regulation and will reveal novel associations between components of the immune system and other biological systems, identify novel immune mediators and pathways, establish predictors of vaccine safety in different populations, and enable the rapid evaluation of different vaccine formulations and administration regimens in human populations. This knowledge base will also serve as a foundation for the future study of immune-mediated diseases in the human, such as allergy, asthma, transplant rejection, autoimmune diseases, and a variety of inflammatory diseases.","identifier":"ImmuneSpace","name":"ImmuneSpace","schema":{"_id":"identifer","creator":"author","citations":"citedBy","identifers":"identifer","species":"species","measurementTechnique":"measurementTechnique","distribution":"distribution","includedInDataCatalog":"includedInDataCatalog","date":"date"},"url":"https://www.immunespace.org/","conditionsOfAccess":"Closed","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.05,"avg_required_ratio":0.22,"total_documents":204,"required_fields":{"name":0.0,"description":0.0,"author":0.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0,"date":0.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"species":1.0,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":2.0,"sum_recommended_coverage":1.0,"binary_required_score":2,"binary_recommended_score":1,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.2222,"percent_recommended_fields":0.0476,"conditionsOfAccess":"Unknown"}}},"clingen":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/clingen/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"3575467","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/35754672805545a6ec1ada43bf9f1c7a429cc3a2/biothings-hub/files/nde-hub/hub/dataload/sources/clingen/uploader.py"},"stats":{"clingen":2160},"download_date":"2026-03-28T15:04:04.344000","version":"2026-03-28T15:03:53Z","upload_date":"2026-03-28T15:04:10.072000","sourceInfo":{"abstract":"ClinicalGenomeResource (ClinGen) is a NIH supported generalist repository that includes genomic data.","description":"ClinGen is a National Institutes of Health (NIH)-funded resource dedicated to building an authoritative central resource that defines the clinical relevance of genes and variants for use in precision medicine and research.","name":"ClinicalGenomeResource (ClinGen)","schema":{"DISEASE ID (MONDO)":"healthCondition.identifier","DISEASE LABEL":"healthCondition.name","GENE SYMBOL":"geneSymbol","GENE ID (HGNC)":"geneId","#Variation":"variantId","Uuid":"variantId","HGVS Expressions":"hgvsExpressions","GCEP":"author","Expert Panel":"author","CLASSIFICATION DATE":"dateModified","Published Date":"dateModified","Approval Date":"dateModified","CLASSIFICATION":"clinicalSignificance","Assertion":"clinicalSignificance","Mode of Inheritance":"modeOfInheritance","MOI":"modeOfInheritance","Applied Evidence Codes (Met)":"appliedEvidenceCodesMet","Applied Evidence Codes (Not Met)":"appliedEvidenceCodesNotMet","Summary of interpretation":"summaryOfInterpretation","Guideline":"guideline","Retracted":"retracted","ONLINE REPORT":"url","Evidence Repo Link":"url"},"url":"https://clinicalgenome.org/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.4773,"avg_required_ratio":0.89,"total_documents":2154,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":1.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0,"healthCondition":1.0,"species":1.0,"variableMeasured":1.0,"citation":0.0,"conditionsOfAccess":1.0,"isBasedOn":1.0,"keywords":0.0,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.9461,"identifier":0.0,"usageInfo":1.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":8.0,"sum_recommended_coverage":9.9461,"binary_required_score":8,"binary_recommended_score":10,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.8889,"percent_recommended_fields":0.4762,"conditionsOfAccess":"Open"}}},"veupathdb":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/veupathdb/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/veupathdb/uploader.py"},"stats":{"veupathdb":3225},"download_date":"2026-03-28T11:00:55.152000","version":"2026-03-28T11:00:54Z","upload_date":"2026-03-28T11:01:00.085000","sourceInfo":{"name":"VEuPathDB","abstract":"The Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) is a NIAID supported IID repository that includes genomic and phenotypic data for eukaryotic pathogens and invertebrate vectors of infectious disease.","description":"The Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) is one of two Bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). VEuPathDB provides access to diverse genomic and other large scale datasets related to eukaryotic pathogens and invertebrate vectors of disease. Organisms supported by this resource include (but are not limited to) the NIAID list of emerging and re-emerging infectious diseases.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://veupathdb.org/veupathdb/app/","identifier":"VEuPathDB","conditionsOfAccess":"Closed","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0837,"avg_augmented_required_ratio":0.0296,"avg_recommended_score_ratio":0.1792,"avg_required_ratio":0.8735,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.9997,"includedInDataCatalog":1.0,"distribution":0.566,"funding":0.4244,"date":0.9692},"recommended_fields":{"dateCreated":0.0,"dateModified":0.9649,"datePublished":0.6005,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.5203,"healthCondition":0.1765,"species":0.319,"variableMeasured":0.2128,"citation":0.6946,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":7.96,"sum_recommended_coverage":5.49,"required_augmented_fields_coverage":{"funding":0.27,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.32,"infectiousAgent":0.52,"healthCondition":0.18,"citation":0.69,"topicCategory":0.0},"binary_required_score":9,"binary_recommended_score":9,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.43,"conditionsOfAccess":"Closed"}}},"biostudies":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/biostudies/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"81a1713","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/81a1713823182b67a87e1180636ef0cfb05f0f49/biothings-hub/files/nde-hub/hub/dataload/sources/biostudies/uploader.py"},"stats":{"biostudies":107822},"download_date":"2026-02-05T18:51:57.085000","version":"2026-02-05T18:39:14Z","upload_date":"2026-02-06T19:17:34.375000","sourceInfo":{"abstract":"BioStudies is a repository that includes life sciences data by organising links to data in other databases at EMBL-EBI or elsewhere.","description":"The mission of BioStudies is to provide access to all the data outputs of a life sciences study from a single place, by organising links to data in other databases at EMBL-EBI or elsewhere, as well as hosting data and metadata that do not fit anywhere else. The database accepts submissions via an online tool, or in a simple tab-delimited format. BioStudies provides rich mechanisms for defining and using metadata guidelines specific for a particular data source such as a project or a community, and organises datasets in collections.","identifier":"BioStudies","name":"BioStudies","schema":{"attachto":"url","releasedate":"datePublished","doi":"doi","title":"name","abstract":"description","description":"description","acknowledgements":"description","funding statement":"description","keywords":"keywords","license":"license","organism":"species.name","method":"measurementTechnique.name","study type":"measurementTechnique.name","experimental design":"measurementTechnique.name","experimental factor":"variablesMeasured.name","files":"distribution","links":"isRelatedTo","authors":"author","organization":"author.affiliation","funding":"funding","image acquisition":"measurementTechnique.name","assays and data":"measurementTechnique.name","publication":"citation"},"url":"https://www.ebi.ac.uk/biostudies/","conditionsOfAccess":"Unknown","genre":"Generalist","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.0418,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.1092,"avg_required_ratio":0.7348,"total_documents":107822,"required_fields":{"name":1.0,"description":0.8587,"author":0.8944,"url":1.0,"measurementTechnique":0.7505,"includedInDataCatalog":1.0,"distribution":0.0622,"funding":0.0345,"date":0.9975},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.9975,"citedBy":0.0,"doi":0.0121,"infectiousAgent":0.1141,"healthCondition":0.0,"species":0.709,"variableMeasured":0.0027,"citation":0.2479,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0091,"license":0.148,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.8362,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.8361},"sum_required_coverage":6.5978,"sum_recommended_coverage":3.0766,"binary_required_score":9,"binary_recommended_score":9,"binary_required_augmented":0,"binary_recommended_augmented":1,"percent_required_fields":1.0,"percent_recommended_fields":0.4286,"conditionsOfAccess":"Unknown"}}},"vivli":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/vivli/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/vivli/uploader.py"},"stats":{"vivli":8427},"download_date":"2026-03-28T12:21:43.481000","version":"2026-03-28T12:21:41Z","url":"https://search.vivli.org/","license_url":"https://vivli.org/resources/vivli-data-use-agreement/","upload_date":"2026-03-28T12:21:50.081000","sourceInfo":{"name":"Vivli","abstract":"Vivli is a GREI repository that includes most data types and domains.","description":"Vivli is an independent non-profit organization launched in 2016. Vivli evolved from a project of The Multi-Regional Clinical Trials Center of Brigham and Women’s Hospital and Harvard(MRCT Center) to enhance access to clinical trials data by promoting data sharing and transparency. In 2013, the MRCT Center and a diverse group of global stakeholders embarked on a mission to define, design, and launch an innovative platform solution for global clinical trial data sharing. The Vivli platform provides access to anonymized individual participant-level data(IPD) or the raw data that is collected during a clinical trial. The clinical trials represented in Vivli are global and contributed by a diverse group of data contributors. By serving as a global trusted platform, Vivli increases the discoverability of available data in the wider research ecosystem, and increases the overall capacity worldwide for effective data sharing, aggregation, re-use, and novel analysis of valuable clinical research data to advance science and improve public health. The Vivli platform is a cloud-based platform that consists of a dynamic search engine, a data repository, and a secure research environment.","schema":{"nctId":"identifer","secondaryIds":"identifier","registryInfo":"sdPublishers","principalInvestigator":"author","studyTitle":"name","leadSponsor":"funding","collaborators":"funding","studyStartDate":"temporalInterval.startDate","actualStudyCompletionDate":"temporalInterval.endDate","locationsOfStudySites":"spatialCoverage","phase":"keywords","studyType":"keywords","conditions":"healthCondition.name","outcomeNames":"variable_measured","digitalObjectId":"doi","studyMetadataDoi":"doi","extractedBriefSummary":"description","draftCreatedDate":"dateCreated","postedDate":"datePublished","updatedDate":"dateModified"},"url":"https://vivli.org/","identifier":"Vivli","conditionsOfAccess":"Restricted","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0462,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.4671,"avg_required_ratio":0.7549,"required_fields":{"name":1.0,"description":0.7716,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.9999,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":0.0,"healthCondition":0.9235,"species":0.0,"variableMeasured":0.7437,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.9884,"license":0.0,"sdPublisher":1.0,"spatialCoverage":0.6792,"temporalCoverage":0.7651,"topicCategory":0.9246,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.77,"sum_recommended_coverage":11.02,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.92},"binary_required_score":7,"binary_recommended_score":12,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.57,"conditionsOfAccess":"Unknown"}}},"hubmap":{"sourceInfo":{"abstract":"The Human BioMolecular Atlas Program (HuBMAP) is an NIH supported repository that includes multimodal data of healthy cells in the human body.","description":"HuBMAP is part of a rich ecosystem of established and emerging atlasing programs supported by NIH and globally by other funding organizations, many of which are focused on specific organs or diseases. HuBMAP has connected with these programs to ensure data interoperability, avoid duplication of work, and leverage and synergize gained knowledge. The consortium has organized a number of events to bring together these communities to discuss topics of shared interest and is committed to improving coordination and collaboration among different programs. In addition, many of the HuBMAP PIs had been or are still actively participating in these efforts, helping with cross-pollination and advancing our global understanding. HuBMAP, as its name implies, was specifically initiated to resolve the challenge of building integrated, comprehensive, high-resolution spatial maps of human tissues and organs, which has resulted in HuBMAP providing leadership in the ecosystem around techniques for integrating disparate, multi-dimensional and multi-scale datasets, the development of a Common Coordinate Framework (CCF) for integrating data across many individuals, and the development and validation of these assays. To further increase interoperability, HuBMAP has adopted a number of standards and processes developed by other domain expert consortia, working and is actively involved in the knowledge exchange. The consortium sees itself as an integral part of the ecosystem, sharing its strengths and actively contributing to the community.","identifier":"HuBMAP","name":"HuBMAP","schema":{"hubmap_id":"name","title":"description","anatomy_0":"keywords","anatomy_1":"keywords","anatomy_2":"keywords","display_subtype":"keywords","contacts.affiliation":"author.affiliation","contacts.first_name":"author.givenName","contacts.last_name":"author.familyName","contacts.middle_name_or_initial":"author.givenName","contacts.name":"author.name","contacts.orcid_id":"author.identifier","contributors.affiliation":"author.affiliation","contributors.first_name":"author.givenName","contributors.last_name":"author.familyName","contributors.middle_name_or_initial":"author.givenName","contributors.name":"author.name","contributors.orcid_id":"author.identifier","created_timestamp":"dateCreated","last_modified_timestamp":"dateModified","published_timestamp":"datePublished","data_access_level":"isAccessibleForFree","data_types":"measurementTechnique.name","dataset_info":"measurementTechnique.description","doi_url":"doi","uuid":"url","file.description":"distribution.name","file.mapped_description":"distribution.description","file.rel_path":"distribution.contentUrl","file.size":"distribution.contentSize","file.type":"distribution.encodingFormat","version":"version","metadata.dag_provenance_list":"isBasedOn.name","metadata.protocols_io_doi":"isBasedOn.doi"},"url":"https://hubmapconsortium.org/","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0316,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.2762,"avg_required_ratio":0.7547,"required_fields":{"name":1.0,"description":1.0,"author":0.7521,"url":1.0,"measurementTechnique":0.7699,"includedInDataCatalog":1.0,"distribution":0.2483,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.7517,"infectiousAgent":0.0,"healthCondition":0.0,"species":0.0,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.9729,"keywords":1.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.636,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.77,"sum_recommended_coverage":6.36,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.63},"binary_required_score":8,"binary_recommended_score":7,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.89,"percent_recommended_fields":0.33,"conditionsOfAccess":"Unknown"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/hubmap/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/hubmap/uploader.py"},"stats":{"hubmap":10119},"download_date":"2026-03-28T15:49:59.694000","version":"2026-03-28T15:49:43Z","upload_date":"2026-03-28T15:50:00.079000"},"clinepidb":{"sourceInfo":{"abstract":"ClinEpiDB is a NIAID supported IID repository that includes epidemiological data.","description":"ClinEpiDB, launched in February 2018, is an open-access exploratory data analysis platform. We integrate data from high quality epidemiological studies, and offer tools and visualizations to explore the data within the browser in a point and click interface. We enable investigators to maximize the utility and reach of their data and to make optimal use of data released by others. ClinEpiDB is led by a team of scientists and developers based at the University of Pennsylvania, the University of Georgia, Imperial College London, and several other academic institutions. Currently, we are funded by the Bill and Melinda Gates Foundation for resource development and data integration, and by NIAID for integration of data from the International Centers of Excellence in Malaria Research (ICEMR).","identifier":"ClinEpiDB","name":"ClinEpiDB","schema":{"Study_Design":"measurementTechnique","description":"description","summary":"description","WHO":"keywords","Participant_Type":"keywords","Country":"spatialCoverage","study_access":"conditionOfAccess","Years":"temporalCoverage","disease":"healthCondition","Publications":"citation","release_date":"distribution.dateModified","dataset_name":"distribution.name","contact_name":"author.name","Contacts":"affiliation","HyperLinks":"isBasedOn.url"},"url":"https://clinepidb.org/ce/app","conditionsOfAccess":"Varied","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.1238,"avg_augmented_required_ratio":0.0592,"avg_recommended_score_ratio":0.362,"avg_required_ratio":0.9389,"total_documents":65,"required_fields":{"name":1.0,"description":1.0,"author":0.9692,"url":1.0,"measurementTechnique":0.9692,"includedInDataCatalog":1.0,"distribution":0.9692,"funding":0.6923,"date":0.9692},"recommended_fields":{"dateCreated":0.0,"dateModified":0.9692,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0154,"healthCondition":1.0,"species":0.0308,"variableMeasured":0.9385,"citation":0.8769,"conditionsOfAccess":1.0,"isBasedOn":0.9692,"keywords":0.9846,"license":0.0,"sdPublisher":0.0,"spatialCoverage":1.0,"temporalCoverage":0.9692,"topicCategory":0.7692,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.5385,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0308,"infectiousAgent":0.0154,"healthCondition":0.9231,"citation":0.8769,"topicCategory":0.7692},"sum_required_coverage":8.5691,"sum_recommended_coverage":10.523,"binary_required_score":9,"binary_recommended_score":13,"binary_required_augmented":1,"binary_recommended_augmented":5,"percent_required_fields":1.0,"percent_recommended_fields":0.619,"conditionsOfAccess":"Varied"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/clinepidb/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/clinepidb/uploader.py"},"stats":{"clinepidb":65},"download_date":"2026-03-28T15:03:39.880000","version":"2026-03-28T15:03:39Z","upload_date":"2026-03-28T15:03:40.079000"},"qiita":{"sourceInfo":{"abstract":"Qiita is a repository that includes microbiome data and analysis tools.","description":"Qiita(canonically pronounced cheetah) is an entirely open-source microbial study management platform. It allows users to keep track of multiple studies with multiple 'omics data. Additionally, Qiita is capable of supporting multiple analytical pipelines through a 3rd-party plugin system, allowing the user to have a single entry point for all of their analyses. Qiita provides database and compute resources to the global community, alleviating the technical burdens that are typically limiting for researchers studying microbial ecology(e.g. familiarity with the command line or access to compute power).Qiita's platform allows for quick reanalysis of the datasets that have been deposited using the latest analytical technologies. This means that Qiita's internal datasets are living data that is periodically re-annotated according to current best practices.","identifier":"Qiita","name":"Qiita","schema":{"study_abstract":"description","study_id":"url","study_alias":"_id","study_title":"name","study_tags":"keywords","pi":"author","pubs":"doi,pmids","ebi_study_accession":"mainEntityOfPage"},"url":"https://qiita.ucsd.edu/","conditionsOfAccess":"Unknown","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.1248,"avg_augmented_required_ratio":0.0181,"avg_recommended_score_ratio":0.0429,"avg_required_ratio":0.5869,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.2957,"date":0.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.5067,"infectiousAgent":0.3055,"healthCondition":0.3755,"species":0.6282,"variableMeasured":0.0,"citation":0.4429,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.3521,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.8626,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":5.3,"sum_recommended_coverage":3.47,"required_augmented_fields_coverage":{"funding":0.16,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.63,"infectiousAgent":0.31,"healthCondition":0.38,"citation":0.44,"topicCategory":0.86},"binary_required_score":6,"binary_recommended_score":7,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.67,"percent_recommended_fields":0.33,"conditionsOfAccess":"Unknown"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/qiita/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/qiita/uploader.py"},"stats":{"qiita":876},"download_date":"2026-03-21T15:00:24.635000","version":"2026-03-21T15:00:13Z","upload_date":"2026-03-21T15:00:30.091000"},"ndex":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/ndex/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/ndex/uploader.py"},"stats":{"ndex":11297},"download_date":"2026-04-02T18:19:02.786000","version":"2026-04-02T18:18:51Z","upload_date":"2026-04-02T18:19:10.091000","sourceInfo":{"name":"The Network Data Exchange (NDEx)","abstract":"The Network Data Exchange (NDEx) is a NIH supported generalist repository that includes generalist data.","description":"The NDEx Project provides an open-source framework where scientists and organizations can store, share, manipulate, and publish biological network knowledge. One of the goals of the project is to create a home for models that are currently available only as figures, tables, or supplementary information, such as networks produced via systematic mining and integration of large-scale molecular data. The NDEx project does not compete with existing pathway and interaction databases, such as Pathway Commons, KEGG, or Reactome; instead, NDEx provides a novel, common distribution channel for these efforts, preserving their identity and attribution rather than subsuming them.","schema":{"name":"name","description":"description","creationTime":"dateCreated","modificationTime":"dateModified","lastmodifieddate":"dateModified","ndex:modificationTime":"dateModified","visibility":"conditionsOfAccess","cxFileSize":"distribution.contentSize","cxFormat":"distribution.encodingFormat","author":"author.name","rightsHolder":"author.name","owner":"author.name","bel:author":"author.name","Author":"author.name","disease":"healthCondition","diseases_id":"healthCondition","organism":"species","species":"species","idmapper.species":"species","species_common_name":"species","ORGANISM":"species","reference":"isRelatedTo.url","figureTitle":"isRelatedTo.name","figureLink":"isRelatedTo.url","uri":"isRelatedTo.url","rights":"license","license":"license","bel:copyright":"license","doi":"doi","labels":"keywords","network type":"keywords","networkType":"keywords","dc:type":"keywords","wikipathwaysIRI":"sameAs","URI":"sameAs","KEGG_PATHWAY_LINK":"sameAs","prov:wasDerivedFrom":"wasDerivedFrom","pmcid":"citation.pmcid","paperTitle":"citation.name","paperLink":"citation.url","Data source":"sdPublisher","TCGA Data Source":"sdPublisher","source":"sdPublisher","dc:date":"date","dataSource":"isBasedOn","Source":"isBasedOn","Treatment":"variableMeasured","methods":"measurementTechnique"},"url":"https://www.ndexbio.org/","identifier":"NDEx","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.3766,"avg_required_ratio":0.8564,"required_fields":{"name":1.0,"description":0.9477,"author":1.0,"url":1.0,"measurementTechnique":0.7469,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0033,"infectiousAgent":0.0009,"healthCondition":0.5188,"species":0.9238,"variableMeasured":0.0,"citation":0.7447,"conditionsOfAccess":1.0,"isBasedOn":0.0031,"keywords":0.9174,"license":0.7727,"sdPublisher":0.0006,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":7.69,"sum_recommended_coverage":7.89,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"binary_required_score":8,"binary_recommended_score":13,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.89,"percent_recommended_fields":0.62,"conditionsOfAccess":"Open"}}},"ark":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/ark/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/ark/uploader.py"},"stats":{"ark":26},"download_date":"2026-04-01T18:45:58.863000","version":"2026-04-01T18:45:47Z","upload_date":"2026-04-01T18:46:00.079000","sourceInfo":{"abstract":"SAGE ARK Portal is a NIAID supported IID repository that includes immune data.","description":"The SAGE Arthritis and Autoimmune and Related Diseases (ARK Portal) is a public data repository that stores and shares data and research knowledge generated by a network of research teams focused on arthritis and autoimmune and related diseases. The ARK Portal is funded by the National Institute of Arthritis and Musculoskeletal and Skin Diseases (NIAMS), and the National Institute of Allergy and Infectious Diseases (NIAID). It is developed and maintained by Sage Bionetworks.","identifier":"SAGE ARK Portal","name":"SAGE ARK Portal","schema":{"name":"name","description":"description","createdOn":"dateCreated","modifiedOn":"dateModified","program":"author.name","datasetStatus":"conditionsOfAccess","datasetType, dataSubtype":"keywords","assay, dataType":"measurementTechnique.name","biospecimenType":"sample.anatomicalStructure.name","biospecimenSubtype":"sample.anatomicalStructure.sampleType","diagnosis":"healthCondition.name","doi":"doi","acknowledgmentStatement":"creditText","publicationSynID":"citation","associatedCodeURL":"isRelatedTo.codeRepository","dbGapAccession, ImmPortAccession":"identifier"},"url":"https://arkportal.synapse.org/","conditionsOfAccess":"Varied","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.4815,"avg_required_ratio":0.9958,"total_documents":26,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.9615,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":0.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":0.0,"healthCondition":1.0,"species":0.0,"variableMeasured":0.0,"citation":0.0385,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":1.0,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":1.0,"identifier":1.0,"usageInfo":1.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":8.9615,"sum_recommended_coverage":10.0385,"binary_required_score":9,"binary_recommended_score":11,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.5238,"conditionsOfAccess":"Restricted"}}},"biosample":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/biosample/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f0127ab","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f0127ab903563b7b054a678d2cae1b5405eb634e/biothings-hub/files/nde-hub/hub/dataload/sources/biosample/uploader.py"},"stats":{"biosample":52930808},"download_date":"2026-03-13T05:42:27.436000","version":"2026-03-13T05:18:53Z","upload_date":"2026-03-14T04:01:03.978000","sourceInfo":{"abstract":"NCBI BioSample is a NIH supported generalist repository that includes other data.","description":"NCBI BioSample is a NIH supported generalist repository that includes other data.","identifier":"NCBI BioSample","name":"NCBI BioSample","url":"https://www.ncbi.nlm.nih.gov/biosample/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.2706,"avg_required_ratio":0.6529,"total_documents":52930808,"required_fields":{"name":1.0,"description":0.0107,"author":0.8037,"url":1.0,"measurementTechnique":0.03,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.297,"healthCondition":0.1494,"species":0.5647,"variableMeasured":0.2345,"citation":0.0,"conditionsOfAccess":1.0,"isBasedOn":0.0529,"keywords":0.0642,"license":0.0,"sdPublisher":0.2973,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":5.8444,"sum_recommended_coverage":5.66,"binary_required_score":8,"binary_recommended_score":11,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.8889,"percent_recommended_fields":0.5238,"conditionsOfAccess":"Varied"}}},"tycho":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/tycho/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"30feb0a","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/30feb0ad31c8882ca54feeae98d8ea9afe7facb5/biothings-hub/files/nde-hub/hub/dataload/sources/tycho/uploader.py"},"stats":{"tycho":597},"download_date":"2025-12-06T20:06:37.293000","version":"2026-03-14T19:06:27Z","upload_date":"2025-12-06T20:06:40.094000","sourceInfo":{"abstract":"Project TYCHO is a NIH supported IID repository that includes clinical data.","description":"The Project Tycho Repository for Global Health Data aims to advance the availabilty and use of data for improving global health. Project Tycho unlocks global health data to a rapidly growing user community of over 3,000 researchers, students, journalists, officials, and others in over 90 countries. A Project Tycho dataset includes case counts for a disease condition in a country. Data for Project Tycho datasets can come from various sources and have been pre-processed into the standard Project Tycho data format.","identifier":"Project Tycho","name":"Project Tycho","schema":{"identifier.identifier":"doi","identifier.identifierSource":"includedInDataCatalog.name","title":"name","description":"description","dates.date":"datePublished, dateModified, dateCreated","storedIn.dates.date":"datePublished, dateModified, dateCreated","storedIn.access.landingPage":"url","storedIn.licenses.identifier.identifier":"license","spatialCoverage":"spatialCoverage","types":"variableMeasured, measurementTechnique","refinement":"keywords","distributions.access.landingPage":"distribution.contentUrl","distributions.access.authorizations.value":"conditionsOfAccess","distributions.formats":"distribution.encodingFormat","creators":"author","licenses.identifier.identifier":"license","acknowledges.funders":"funding.funder","acknowledges.awardees":"author","relatedIdentifiers.identifier.identifier":"isBasedOn.url","dates.type.value":"datePublished, dateModified, dateCreated, temporalCoverage","isAbout":"infectousAgent, healthCondition, variableMeasured"},"url":"https://www.tycho.pitt.edu/","genre":"IID","conditionsOfAccess":"Closed","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.6859,"avg_required_ratio":1.0,"total_documents":597,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":1.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":0.0,"datePublished":1.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":1.0,"healthCondition":1.0,"species":1.0,"variableMeasured":1.0,"citation":0.0,"conditionsOfAccess":1.0,"isBasedOn":0.397,"keywords":1.0,"license":1.0,"sdPublisher":0.0,"spatialCoverage":1.0,"temporalCoverage":1.0,"topicCategory":1.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":9.0,"sum_recommended_coverage":14.397,"binary_required_score":9,"binary_recommended_score":15,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.7143,"conditionsOfAccess":"Closed"}}},"dataverse":{"sourceInfo":{"abstract":"Harvard Dataverse is a GREI repository that includes most data types and domains.","description":"The Harvard Dataverse Repository is a free data repository open to all researchers from any discipline, both inside and outside of the Harvard community, where you can share, archive, cite, access, and explore research data. Each individual Dataverse collection is a customizable collection of datasets (or a virtual repository) for organizing, managing, and showcasing datasets.","identifier":"Harvard Dataverse","name":"Harvard Dataverse","schema":{"@context":"@context","@type":"@type","identifier":["url","doi","identifier"],"name":"name","creator":"author","author":"author","datePublished":"datePublished","dateModified":"dateModified","description":"description","keywords":"keywords","citation":"citation.citation","license":"license","includedInDataCatalog":"includedInDataCatalog","publisher":"sdPublisher","funder":"funder","distribution":"distribution","type":"@type","global_id":"doi","published_at":"datePublished","identifier_of_dataverse":"sdPublisher.identifier","name_of_dataverse":"sdPublisher.name","subjects":"topicCategory","createdAt":"dateCreated","updatedAt":"dateModified","authors":"author.name"},"url":"https://dataverse.harvard.edu/","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Quarterly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0215,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.3738,"avg_required_ratio":0.7131,"total_documents":295448,"required_fields":{"name":1.0,"description":0.9286,"author":0.998,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.3721,"funding":0.1069,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":0.0383,"healthCondition":0.0536,"species":0.1052,"variableMeasured":0.0,"citation":0.6387,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.6924,"license":0.3739,"sdPublisher":1.0,"spatialCoverage":0.1563,"temporalCoverage":0.0336,"topicCategory":0.2346,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.1049,"infectiousAgent":0.0375,"healthCondition":0.0532,"citation":0.0,"topicCategory":0.2345},"sum_required_coverage":6.4056,"sum_recommended_coverage":8.3266,"binary_required_score":8,"binary_recommended_score":15,"binary_required_augmented":0,"binary_recommended_augmented":4,"percent_required_fields":0.8889,"percent_recommended_fields":0.7143,"conditionsOfAccess":"Varied"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/dataverse/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/dataverse/uploader.py"},"stats":{"dataverse":295448},"download_date":"2026-04-02T15:55:06.558000","version":"2026-04-02T00:02:58Z","upload_date":"2026-04-02T15:55:10.090000"},"lincs":{"sourceInfo":{"abstract":"The Library of Integrated Network-Based Cellular Signatures (LINCS) Data Portal is an NIH supported repository that includes gene expression and other cellular processes data.","description":"The BD2K-LINCS DCIC is comprised of four major components: Integrated Knowledge Environment (IKE), Data Science Research (DSR), Community Training and Outreach (CTO) and Consortium Coordination and Administration (CCA). The Center is constructing a high-capacity scalable integrated knowledge environment enabling federated access, intuitive querying and integrative analysis and visualization across all LINCS resources and many additional external data types from other relevant resources. The Center’s data science research projects are aimed at addressing various data integration and intracellular molecular regulatory network challenges. The Center aims to develop: 1) methods to connect cellular and organismal phenotypes with molecular cellular signatures, and 2) novel data visualization methods for dynamically interacting with large-genomics and proteomics datasets.","identifier":"LINCS","name":"LINCS","schema":{"centerdatasetid":"url","funding":"funding","assayoverview":"description","centerurl":"author.url","description":"description","principalinvestigator":"author.name","centerfullname":"author.affiliation","datemodified":"dateUpdated","screeninglabinvestigator":"author.name","datasetname":"name","datasetid":"identifier","datereleased":"datePublished","assayname":"measurementTechnique","assayformat":"measurementTechnique","assaydesignmethod":"keywords","physicaldetection":"variableMeasured","biologicalprocess":"keywords","technologies":"keywords","biologicalbucket":"keywords","endpointcategorization":"keywords","size":"distribution.contentSize","datasetgroup":"isRelatedTo","toollink":"isBasedOn","tool":"isBasedOn","protocol":"isBasedOn.url","protein":"keywords"},"url":"https://lincsportal.ccs.miami.edu/","conditionsOfAccess":"Unknown","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0416,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.2549,"avg_required_ratio":0.9772,"required_fields":{"name":1.0,"description":0.8915,"author":1.0,"url":1.0,"measurementTechnique":0.9906,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.9222,"date":0.9882},"recommended_fields":{"dateCreated":0.0,"dateModified":0.691,"datePublished":0.9882,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0,"healthCondition":0.0024,"species":0.0165,"variableMeasured":0.9788,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.6392,"keywords":1.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.8137,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":8.79,"sum_recommended_coverage":6.13,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.02,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.81},"binary_required_score":9,"binary_recommended_score":9,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.43,"conditionsOfAccess":"Unknown"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/lincs/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/lincs/uploader.py"},"stats":{"lincs":424},"download_date":"2026-03-07T16:00:08.648000","version":"2026-03-07T16:00:08Z","upload_date":"2026-03-07T16:00:10.059000"},"malariagen":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/malariagen/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/malariagen/uploader.py"},"stats":{"malariagen":59},"download_date":"2026-03-28T19:00:50.390000","version":"2026-03-28T19:00:49Z","upload_date":"2026-03-28T19:01:00.090000","sourceInfo":{"name":"MalariaGEN","abstract":"Malaria Genomic Epidemiology Network (MalariaGEN) is a IID repository that includes clinical data.","description":"MalariaGEN is an international network of researchers focused on understanding the genetic variations in humans, Plasmodium parasites, and Anopheles mosquitoes to better control malaria transmission. By leveraging advanced genomic tools and techniques, MalariaGEN aims to uncover how genetic differences influence susceptibility to malaria, track insecticide resistance in mosquitoes, and detect drug resistance in parasites. The network's efforts are crucial for developing new interventions and maintaining the effectiveness of existing ones. Coordinated from the Wellcome Sanger Institute in the UK, MalariaGEN collaborates with over 200 partners across more than 40 countries, primarily in malaria-endemic regions.","schema":{"title":"name","released on":"datePublished","project":"isPartOf","url":"identifier","keywords":"keywords","datasets":"distribution","citations":"citation","data package contact":"author","spatialCoverage":"spatialCoverage"},"url":"https://www.malariagen.net/","identifier":"MalariaGEN","conditionsOfAccess":"Varied","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.05,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.19,"avg_required_ratio":0.78,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":1.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0,"healthCondition":1.0,"species":0.0,"variableMeasured":0.0,"citation":1.0,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":1.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":7.0,"sum_recommended_coverage":5.0,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":1.0,"citation":0.0,"topicCategory":0.0},"binary_required_score":7,"binary_recommended_score":5,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.24,"conditionsOfAccess":"Varied"}}},"dde":{"license":"Creative Commons Attribution 4.0 International","code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/dde/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"2132891","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/213289125e5b25073d0d145d9239e4267f6acd9e/biothings-hub/files/nde-hub/hub/dataload/sources/dde/uploader.py"},"stats":{"dde":660},"download_date":"2026-03-21T20:06:53.863000","version":"2026-03-21T20:06:53Z","url":"https://discovery.biothings.io/api/dataset/","license_url":"https://creativecommons.org/licenses/by/4.0/","upload_date":"2026-03-21T20:07:00.102000","sourceInfo":{"name":"Data Discovery Engine","abstract":"The Data Discovery Engine is a NIAID supported metadata registry that includes metadata from IID and general repositories.","description":"The Data Discovery Engine is a streamlined process to create, distribute and harves findable metadata via interoperable Schema.org schemas. The biomedical and informatics communities have largely endorsed the spirit and basic components of the FAIR Data Principles. Biomedical data producers, including CTSA hubs, need actionable best-practice guidance on how to make their data discoverable and reusable, and bring the practical benefits of data sharing to researcher's own research projects, as well as the research community as a whole.","schema":{"creator":"author","_id":"identifier","date_created":"dateCreated","last_updated":"dateModifed","@type":"@type","measurementTechnique":"measurementTechnique","infectiousAgent":"infectiousAgent","infectiousDisease":"infectiousDisease","species":"species"},"url":"https://discovery.biothings.io/","identifier":"Data Discovery Engine","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0588,"avg_augmented_required_ratio":0.018,"avg_recommended_score_ratio":0.3244,"avg_required_ratio":1.0,"total_documents":660,"required_fields":{"name":1.0,"description":1.0,"author":0.9985,"url":1.0,"measurementTechnique":0.9242,"includedInDataCatalog":1.0,"distribution":0.903,"funding":1.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":1.0,"datePublished":0.2576,"citedBy":0.053,"doi":0.0076,"infectiousAgent":0.6,"healthCondition":0.6379,"species":0.4955,"variableMeasured":0.0909,"citation":0.6061,"conditionsOfAccess":0.0879,"isBasedOn":0.053,"keywords":0.0606,"license":0.2227,"sdPublisher":0.7106,"spatialCoverage":0.1152,"temporalCoverage":0.1152,"topicCategory":0.647,"identifier":1.0,"usageInfo":0.0561,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.1545,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0152,"healthCondition":0.3636,"citation":0.2894,"topicCategory":0.5561},"sum_required_coverage":8.8257,"sum_recommended_coverage":7.8169,"binary_required_score":9,"binary_recommended_score":20,"binary_required_augmented":1,"binary_recommended_augmented":4,"percent_required_fields":1.0,"percent_recommended_fields":0.9524,"conditionsOfAccess":"Varied"}}},"ncbi_bioproject":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_bioproject/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_bioproject/uploader.py"},"stats":{"ncbi_bioproject":1052279},"download_date":"2026-03-28T23:09:52.302000","version":"2026-03-28T23:09:00Z","upload_date":"2026-03-28T23:10:00.086000","sourceInfo":{"abstract":"NCBI BioProject is a NIH supported generalist repository that includes multiomic data.","description":"A BioProject is a collection of biological data related to a single initiative, originating from a single organization or from a consortium. A BioProject record provides users a single place to find links to the diverse data types generated for that project.","identifier":"NCBI BioProject","name":"NCBI BioProject","schema":{"ProjectDescr/Title":"name","ProjectDescr/Name":"name","ProjectDescr/Description":"description","ProjectID/ArchiveID/@accession":"identifier, url, _id","Submission/@submitted":"datePublished","Submission/@last_update":"dateModified","ProjectDataTypeSet/DataType":"variableMeasured","IntendedDataTypeSet/DataType":"variableMeasured","Objectives/Data/@data_type":"variableMeasured","ProjectTypeSubmission/Method/@method_type":"measurementTechnique","ProjectTypeSubmission/Target/Organism/@taxID":"species.identifier","ProjectTypeSubmission/Target/Organism/OrganismName":"species.name","ProjectDescr/Grant/@GrantId":"funding.identifier","ProjectDescr/Grant/Title":"funding.name","ProjectDescr/Grant/Agency/@abbr":"funding.funder.alternateName","ProjectDescr/Grant/Agency":"funding.funder.name","ProjectDescr/Grant/PI/Given":"author.givenName","ProjectDescr/Grant/PI/Last":"author.familyName","ProjectDescr/Grant/PI/@affil":"author.affiliation.name","ProjectTypeSubmission/Target/Provider":"author.name","Submission/Description/Organization/Name":"author.name","Submission/Description/Organization/@role":"author.role","ProjectDescr/Publication/@id":"citation.pmid, citation.pmcid","ProjectLinks/Link/ProjectIDRef/@accession":"hasPart.identifier, isPartOf.identifier","Submission/Description/Access":"conditionsOfAccess","ProjectDescr/Relevance/Medical":"keywords","ProjectTypeSubmission/Target/@sample_scope":"keywords"},"url":"https://www.ncbi.nlm.nih.gov/bioproject/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.2182,"avg_required_ratio":0.6518,"total_documents":1048978,"required_fields":{"name":1.0,"description":0.9687,"author":0.0143,"url":1.0,"measurementTechnique":0.9674,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0612,"date":0.826},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.826,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.2937,"healthCondition":0.0,"species":0.5505,"variableMeasured":0.9394,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.9438,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":5.8376,"sum_recommended_coverage":4.5534,"binary_required_score":8,"binary_recommended_score":6,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.8889,"percent_recommended_fields":0.2857,"conditionsOfAccess":"Unknown"}}},"ncbi_sra":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_sra/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"2132891","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/213289125e5b25073d0d145d9239e4267f6acd9e/biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_sra/uploader.py"},"stats":{"ncbi_sra":658401},"download_date":"2026-04-02T15:59:59.608000","version":"2026-04-02T15:54:52Z","upload_date":"2026-04-02T16:00:00.076000","sourceInfo":{"abstract":"Sequence Read Archive (SRA) is the NIH supported largest publicly available repository of high throughput sequencing data that includes raw sequencing data and alignment information for most domains.","description":"Sequence Read Archive(SRA) data, available through multiple cloud providers and NCBI servers, is the largest publicly available repository of high throughput sequencing data. The archive accepts data from all branches of life as well as metagenomic and environmental surveys. SRA stores raw sequencing data and alignment information to enhance reproducibility and facilitate new discoveries through data analysis.","identifier":"NCBI SRA","name":"NCBI SRA","schema":{"Accession":"url","Updated":"dateModified","Published":"datePublished","Recieved":"dateCreated","Visibility":"conditionsOfAccess","ReplacedBy":"sameAs","study_title":"name","study_abstract":"description","contact_name":"author","GCP_url":"contentUrl","GCP_free_egress":"isAccessibleForFree","AWS_url":"contentUrl","AWS_free_egress":"isAccessibleForFree","organism_taxid":"species.identifier","organism_name":"species.name","run_accession":"isBasedOn.identifier","BioProject":"isBasedOn.identifier","experiment_accession":"isBasedOn.identifier","sample_accession":"isBasedOn.identifier","instrument":"isBasedOn.identifier","cell line":"isBasedOn.identifier","HapMap sample ID":"isBasedOn.identifier"},"url":"https://www.ncbi.nlm.nih.gov/sra","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Quarterly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0749,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.1401,"avg_required_ratio":0.5522,"required_fields":{"name":1.0,"description":0.9347,"author":0.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.4626,"healthCondition":0.0982,"species":0.2128,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":1.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.7381,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":4.93,"sum_recommended_coverage":4.51,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.21,"infectiousAgent":0.46,"healthCondition":0.1,"citation":0.0,"topicCategory":0.74},"binary_required_score":5,"binary_recommended_score":7,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.56,"percent_recommended_fields":0.33,"conditionsOfAccess":"Unknown"}}},"acd_niaid":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/acd_niaid/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/acd_niaid/uploader.py"},"stats":{"acd_niaid":12},"download_date":"2026-04-02T18:22:31.073000","version":"2026-04-02T18:22:16Z","upload_date":"2026-04-02T18:22:40.092000","sourceInfo":{"name":"AccessClinicalData@NIAID","abstract":"AccessClinicalData is a NIAID supported IID repository that includes clinical trials data.","description":"AccessClinicalData@NIAID is a NIAID cloud-based, secure data platform that enables sharing of and access to reports and data sets from NIAID COVID-19 and other sponsored clinical trials for the basic and clinical research community.","schema":{"title":"name","cmc_unique_id":"identifier","brief_summary":"description","data_availability_date":"datePublished","most_recent_update":"dateModified","data_available":"additionalType","creator":"funding.funder.name","nct_number":"nctid, identifier","condition":"healthCondition","clinical_trial_website":"mainEntityOfPage","publications":"citation","data_available_for_request":"conditionsOfAccess"},"url":"https://accessclinicaldata.niaid.nih.gov/","identifier":"AccessClinicalData@NIAID","conditionsOfAccess":"Varied","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0567,"avg_augmented_required_ratio":0.0825,"avg_recommended_score_ratio":0.2517,"avg_required_ratio":0.6425,"total_documents":12,"required_fields":{"name":1.0,"description":1.0,"author":0.0,"url":1.0,"measurementTechnique":0.5833,"includedInDataCatalog":1.0,"distribution":0.0,"funding":1.0,"date":0.75},"recommended_fields":{"dateCreated":0.0,"dateModified":0.25,"datePublished":0.75,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0833,"healthCondition":1.0,"species":0.1667,"variableMeasured":0.0,"citation":0.6667,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.5,"identifier":1.0,"usageInfo":1.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.1667,"measurementTechnique":0.5833},"recommended_augmented_fields_coverage":{"species":0.1667,"infectiousAgent":0.0833,"healthCondition":0.1667,"citation":0.25,"topicCategory":0.5},"sum_required_coverage":6.3333,"sum_recommended_coverage":6.4167,"binary_required_score":7,"binary_recommended_score":10,"binary_required_augmented":2,"binary_recommended_augmented":5,"percent_required_fields":0.7778,"percent_recommended_fields":0.4762,"conditionsOfAccess":"Restricted"}}},"immport":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/immport/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/immport/uploader.py"},"stats":{"immport":1419},"download_date":"2026-03-28T19:16:16.040000","version":"2026-03-28T19:16:05Z","url":"https://www.immport.org/shared/home","license_url":"https://docs.immport.org/home/agreement/","upload_date":"2026-03-28T19:16:20.403000","sourceInfo":{"name":"ImmPort","abstract":"The Immunology Database and Analysis Portal (ImmPort) is a NIAID supported IID repository that includes multimodal immunological data.","description":"The ImmPort project provides advanced information technology support in the archiving and exchange of scientific data for the diverse community of life science researchers supported by NIAID/DAIT and serves as a long-term, sustainable archive of research and clinical data. The core component of ImmPort is an extensive data warehouse containing experimental data and metadata describing the purpose of the study and the methods of data generation. The functionality of ImmPort will be expanded continuously over the life of the BISC project to accommodate the needs of expanding research communities. The shared research and clinical data, as well as the analytical tools in ImmPort are available to any researcher after registration.","schema":{"_id":"identifer","creator":"author","citations":"citedBy","identifers":"identifer","species":"species","measurementTechnique":"measurementTechnique","distribution":"distribution","includedInDataCatalog":"includedInDataCatalog","date":"date"},"url":"https://www.immport.org/shared/home","identifier":"ImmPort - Bioinformatics For the Future of Immunology","conditionsOfAccess":"Closed","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0528,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.3232,"avg_required_ratio":0.9048,"required_fields":{"name":1.0,"description":1.0,"author":0.6759,"url":1.0,"measurementTechnique":0.4586,"includedInDataCatalog":1.0,"distribution":1.0,"funding":1.0,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.8442,"doi":1.0,"infectiousAgent":0.2707,"healthCondition":0.9991,"species":0.1567,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.9875,"keywords":1.0,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.6402,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":8.13,"sum_recommended_coverage":7.9,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.16,"infectiousAgent":0.27,"healthCondition":0.0,"citation":0.0,"topicCategory":0.64},"binary_required_score":9,"binary_recommended_score":10,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.48,"conditionsOfAccess":"Unknown"}}},"pdb":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/pdb/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/pdb/uploader.py"},"stats":{"pdb":142356},"download_date":"2026-03-28T17:35:17.402000","version":"2026-03-28T17:34:51Z","upload_date":"2026-03-28T17:35:20.074000","sourceInfo":{"abstract":"Protein Data Bank is a NIAID supported generalist repository that includes structure data.","description":"RCSB PDB (RCSB.org) is the US data center for the global Protein Data Bank (PDB) archive of 3D structure data for large biological molecules (proteins, DNA, and RNA) essential for research and education in fundamental biology, health, energy, and biotechnology. The RSCB PDB hosts ~240 K structures from the PDB archive; however, only the subset of the RSCB PDB that was funded by NIAID or has a potentially pathogenic organism is included in the Discovery Portal.","identifier":"Protein Data Bank","name":"Protein Data Bank","schema":{"organisms":"species.name","struct.title":"name, description","rscb_id":"_id, identifier, doi","audit_author":"author","citation":"citation","exptl":"measurementTechnique","pdb_audit_support":"funding","rcsb_accession_info.deposit_date":"datePublished","rcsb_accession_info.revision_date":"dateModified","struct_keywords":"keywords","rcsb_external_references":"sameAs"},"url":"https://www.rcsb.org/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.5752,"avg_required_ratio":0.9393,"total_documents":142183,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.9983,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.4503,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":0.9922,"healthCondition":0.0,"species":0.1146,"variableMeasured":1.0,"citation":0.9997,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":0.9983,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":1.0,"identifier":1.0,"usageInfo":1.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":8.4486,"sum_recommended_coverage":12.1048,"binary_required_score":9,"binary_recommended_score":13,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.619,"conditionsOfAccess":"Open"}}},"biotools":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/biotools/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/biotools/uploader.py"},"stats":{"biotools":32927},"download_date":"2026-03-03T19:24:46.173000","version":"2026-03-03T19:24:29Z","upload_date":"2026-03-03T19:24:51.318000","sourceInfo":{"abstract":"bio.tools is an ELIXIR supported tool repository that includes information about software tools, databases and services.","description":"The use of bioinformatics is ubiquitous within the life sciences.  In bio.tools, we are striving to provide a comprehensive registry of software and databases, facilitating researchers from across the spectrum of biological and biomedical science to find, understand, utilise and cite the resources they need in their day-to-day work.\nEverything from simple command-line tools and online services, through to databases and complex, multi-functional analysis workflows is included. Resources are described in a rigorous semantics and syntax, providing end-users with the convenience of concise, consistent and therefore comparable information.\nEach bio.tools entry is assigned a human-readable, unique identifier based on the resource name, e.g. biotools:signalp.  These identifiers provide a persistent reference to our Tool Cards of essential information, as well as a means to trace resources and integrate bio.tools data with other resources.\nbio.tools was supported by ELIXIR through the  ELIXIR-EXCELERATE grant, which was funded by the European Union Horizon 2020 program under grant agreement 676559.","identifier":"bio.tools","name":"bio.tools","schema":{"name":"name","description":"description","homepage":"mainEntityOfPage","biotoolsID":"identifier, url, _id","additionDate":"datePublished","lastUpdate":"dateModified","topic":"topicCategory","function":"featureList, input, output","credit":"author, contributor, funding.funder","publication":"citation, isBasedOn, citedBy, isBasisFor","relation":"sameAs, isBasedOn, isBasisFor, hasPart, isPartOf, isRelatedTo","version":"softwareVersion","license":"license","language":"programmingLanguage","operatingSystem":"operatingSystem","link":"sdPublisher, codeRepository, isRelatedTo","download":"softwareHelp, softwareAddOn, downloadUrl, thumbnailUrl, codeRepository, availableOnDevice, applicationSuite","cost":"isAccessibleForFree","accessibility":"conditionsOfAccess","documentation":"softwareHelp","otherID":"doi","toolType":"applicationCategory","collectionID":"keywords","maturity":"creativeWorkStatus"},"url":"https://bio.tools/","genre":"Generalist","conditionsOfAccess":"Varied","type":"Computational Tool Repository","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.4588,"avg_required_ratio":0.7901,"total_documents":32927,"required_fields":{"date":1.0,"includedInDataCatalog":1.0,"funding":0.0113,"author":0.739,"description":1.0,"name":1.0},"recommended_fields":{"citedBy":0.7203,"doi":0.001,"topicCategory":0.9824,"codeRepository":0.0924,"programmingLanguage":0.6493,"applicationCategory":0.8256,"applicationSubCategory":0.0,"input":0.1202,"output":0.099,"featureList":0.9474,"operatingSystem":0.6123,"softwareRequirements":0.0,"softwareVersion":0.1964,"citation":0.2202,"conditionsOfAccess":0.2772,"dateModified":1.0,"interactionStatistic":0.0,"license":0.4323,"identifier":1.0,"url":1.0},"required_augmented_fields_coverage":{"funding":0.0},"recommended_augmented_fields_coverage":{"citation":0.0,"topicCategory":0.0},"sum_required_coverage":4.7503,"sum_recommended_coverage":9.176,"binary_required_score":6,"binary_recommended_score":17,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.85,"conditionsOfAccess":"Varied"}}},"node":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/node/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"6742850","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/67428509984b92187a6e025e462a7959770e9d77/biothings-hub/files/nde-hub/hub/dataload/sources/node/uploader.py"},"stats":{"node":1619},"download_date":"2026-03-31T22:00:04.814000","version":"2026-03-31T22:00:02Z","upload_date":"2026-03-31T22:00:10.064000","sourceInfo":{"abstract":"NODE is a Chinese Academy of Sciences supported generalist repository that includes multiomic data.","description":"NODE (National Omics Data Encyclopedia) is a biological big data collection platform, including the experimental sample information collection, the file upload of the sequences, and the analysis, share and download of the results. NODE platform consists of six main modules: project, sample, experiment, run, data, and analysis. Project and Sample are independent of each other, but can be linked through Run. In this way, the metadata and sequence information can be integrated.","identifier":"National Omics Data Encyclopedia","name":"National Omics Data Encyclopedia (NODE)","schema":{"projectNo":"identifier","name":"name","publishes.doi":"citation.doi","publishes.pmid":"citation.pmid","submitter.firstName":"author.givenName","submitter.lastName":"author.familyName","submitter.orgName":"author.affiliation.name","attributes.library_selection":"measurementTechnique.name","attributes.library_strategy":"measurementTechnique.name","attributes.platform":"measurementTechnique.name"},"url":"https://www.biosino.org/node/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0328,"avg_augmented_required_ratio":0.0031,"avg_recommended_score_ratio":0.1368,"avg_required_ratio":0.7365,"total_documents":1611,"required_fields":{"name":1.0,"description":0.7076,"author":0.9634,"url":1.0,"measurementTechnique":0.9615,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0366,"date":0.9634},"recommended_fields":{"dateCreated":0.9634,"dateModified":0.9634,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.013,"healthCondition":0.2222,"species":0.2924,"variableMeasured":0.0,"citation":0.1378,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0279,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.2924,"infectiousAgent":0.013,"healthCondition":0.221,"citation":0.1378,"topicCategory":0.0},"sum_required_coverage":6.6325,"sum_recommended_coverage":3.5922,"binary_required_score":8,"binary_recommended_score":7,"binary_required_augmented":1,"binary_recommended_augmented":4,"percent_required_fields":0.8889,"percent_recommended_fields":0.3333,"conditionsOfAccess":"Unknown"}}},"mendeley":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/mendeley/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/mendeley/uploader.py"},"stats":{"mendeley":138899},"download_date":"2026-03-29T02:45:31.079000","version":"2026-03-29T02:45:17Z","upload_date":"2026-03-29T02:45:40.075000","sourceInfo":{"name":"Mendeley Data","abstract":"Mendeley Data is a GREI repository that includes most data types and domains.","description":"Mendeley Data, a product of Elsevier, is one of the newest entrants in the research data repository landscape; the platform was released in April 2016. Mendeley Data is a general-purpose repository, allowing researchers in any field to upload and publish research data. Mendeley Data also allows researchers to share unpublished data privately with research collaborators.","schema":{"id":"identifer","doi":"doi","name":"name","description":"description","contributors":"contributors","files":"distribution","articles":"citation","categories":"keywords","publish_date":"datePublished","related_links":"citation","modified_on":"dateModified","links":"url","repository":"sdPublisher"},"url":"https://data.mendeley.com/","identifier":"Mendeley","conditionsOfAccess":"Varied","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0244,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.3444,"avg_required_ratio":0.6791,"required_fields":{"name":1.0,"description":0.9954,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0875,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":0.0,"healthCondition":0.0,"species":0.0,"variableMeasured":0.0,"citation":0.2879,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":1.0,"license":0.9992,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.4891,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.08,"sum_recommended_coverage":7.78,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.49},"binary_required_score":7,"binary_recommended_score":9,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.43,"conditionsOfAccess":"Unknown"}}},"massive":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/massive/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/massive/uploader.py"},"stats":{"massive":117},"download_date":"2026-03-28T23:14:03.774000","version":"2026-03-28T23:14:03Z","upload_date":"2026-03-28T23:14:10.071000","sourceInfo":{"name":"MassIVE","abstract":"MassIVE is a NIH supported Basic science repository that includes mass spectrometry data.","description":"MassIVE is a community resource developed by the NIH-funded Center for Computational Mass Spectrometry to promote the global, free exchange of mass spectrometry data. MassIVE datasets can be assigned ProteomeXchange accessions to satisfy publication requirements.","schema":{"dataset":"identifier","task":"url","repo_path":"distribution","title":"name","site":"sdPublisher","description":"description","keywords":"keywords","create_time":"dateCreated","instrument_resolved":"measurementTechnique","species_resolved":"species","pis":"author","publications":"citation","privacy":"conditionsOfAccess"},"url":"https://massive.ucsd.edu/ProteoSAFe/static/massive.jsp","identifier":"MassIVE","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.015,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.2729,"avg_required_ratio":0.8024,"required_fields":{"name":0.9993,"description":0.5989,"author":0.6051,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.4194,"infectiousAgent":0.163,"healthCondition":0.0848,"species":0.0532,"variableMeasured":0.0,"citation":0.1355,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":0.595,"license":0.602,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":7.2,"sum_recommended_coverage":6.05,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.05,"infectiousAgent":0.16,"healthCondition":0.08,"citation":0.0,"topicCategory":0.0},"binary_required_score":8,"binary_recommended_score":11,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.89,"percent_recommended_fields":0.52,"conditionsOfAccess":"Open"}}},"figshare":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/figshare/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"6977c07","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/6977c0716ac440f6f6766a70a5c8325ccf8085c3/biothings-hub/files/nde-hub/hub/dataload/sources/figshare/uploader.py"},"stats":{"figshare":1713292},"download_date":"2025-11-13T18:53:48.496000","version":"2025-11-13T18:50:29Z","upload_date":"2026-01-07T22:28:37.247000","sourceInfo":{"name":"Figshare","abstract":"Figshare is a NIH supported generalist repository that includes generalist data.","description":"Figshare is a repository where users can make all of their research outputs available in a citable, shareable and discoverable manner.","schema":{"title":"name","creator":"author","subject":"keywords","description":"description","date":"dateModified","publisher":"sdPublisher","type":"@type","identifier":"doi","language":"language","relation":"url","license":"license","issued":"datePublished","sponsor":"funding"},"url":"https://figshare.com/","identifier":"Figshare","conditionsOfAccess":"Unknown","genre":"Generalist","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.0269,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.3801,"avg_required_ratio":0.6792,"total_documents":1713292,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0832,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.9957,"infectiousAgent":0.1423,"healthCondition":0.1891,"species":0.2141,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":1.0,"license":1.0,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":1.0,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.2141,"infectiousAgent":0.1423,"healthCondition":0.186,"citation":0.0,"topicCategory":0.0},"sum_required_coverage":6.0832,"sum_recommended_coverage":8.5412,"binary_required_score":7,"binary_recommended_score":11,"binary_required_augmented":0,"binary_recommended_augmented":3,"percent_required_fields":0.7778,"percent_recommended_fields":0.5238,"conditionsOfAccess":"Unknown"}}},"veupath_collections":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/veupath_collections/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"0f12063","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/0f12063346c841ceee3cefdad4563482efaf33c2/biothings-hub/files/nde-hub/hub/dataload/sources/veupath_collections/uploader.py"},"stats":{"veupath_collections":3197},"download_date":"2026-03-28T23:00:14.055000","version":"2026-03-28T23:00:13Z","upload_date":"2026-03-28T23:00:20.373000","sourceInfo":{"name":"VEuPath Collections","abstract":"VEuPathCollections are NIAID supported IID component repositories of VEuPathDB which include collections of genomic data.","description":"VEuPath Collections is the collection of component websites of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) that have been constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). \nThe VEuPath Collections include the following component websites as individual collections: \nAmoebaDB \nCryptoDB \nGiardiaDB \nHostDB \nPlasmoDB \nVectorBase \nFungiDB \nMicrosporidiaDB \nToxoDB \nTrichDB \nTriTrypDB \nPiroplasmaDB.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://veupathdb.org/veupathdb/app/","identifier":"VEuPathDB","conditionsOfAccess":"Closed","genre":"IID","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.0,"avg_required_ratio":0.11,"required_fields":{"name":0.0,"description":0.0,"author":0.0,"url":0.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0,"date":0.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"species":0.0,"variableMeasured":0.0,"citation":0.0,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.0,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":1.0,"sum_recommended_coverage":0.0,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.0,"healthCondition":0.0,"citation":0.0,"topicCategory":0.0},"binary_required_score":1,"binary_recommended_score":0,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.11,"percent_recommended_fields":0.0,"conditionsOfAccess":"Unknown"}}},"dbgap":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/dbgap/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/dbgap/uploader.py"},"stats":{"dbgap":2865},"download_date":"2026-03-04T20:52:02.819000","version":"2026-03-04T20:51:50Z","upload_date":"2026-03-04T20:52:10.089000","sourceInfo":{"abstract":"Database of Genotypes and Phenotypes (dbGaP) is a NIH supported IID repository that includes multiomic data.","description":"The database of Genotypes and Phenotypes (dbGaP) was developed to archive and distribute the data and results from studies that have investigated the interaction of genotype and phenotype in Humans. Such studies include genome-wide association studies, medical sequencing, molecular diagnostic assays, as well as association between genotype and non-clinical traits. The individual level data hosted at the dbGaP is distributed through a controlled access system. The types of data distributed through the dbGaP include phenotype data, association (GWAS) data, summary level analysis data, SRA (Short Read Archive) data, reference alignment (BAM) data, VCF (Variant Call Format) data, expression data, imputed genotype data, image data, etc.","identifier":"The Database of Genotypes and Phenotypes","name":"Database of Genotypes and Phenotypes (dbGaP)","schema":{"@accession":"identifier","@parentstudy":"isPartOf.identifier","@createdate":"dateCreated","@moddate":"dateModified","attributions":"author, funding","consentgroups.consentgroup.@longname":"usageInfo","description":"description","diseases.disease.@vocab_source":"healthCondition.inDefinedTermSet","diseases.disease.@vocab_term":"healthCondition.name","plaintextdescription":"description","publications.publication.pubmed.@pmid":"citation.pmid","studyhistory":"description","studyinex":"description","studynameentrez":"name","studynamereportpage":"name","studytypes.studytype":"measurementTechnique.name","studyurls.url.@name":"isRelatedTo.name","studyurls.url.@url":"isRelatedTo.url","authorizedaccess.policy.documentset.datausecertificate.@filepath":"license","authorizedaccess.policy.acknowledgementtext.para":"license","authorizedaccess.consentgroups.participantset.irbrequired":"conditionsOfAccess","authorizedaccess.policy.embargolength":"conditionsOfAccess","authorizedaccess.policy.displaypublicsummary":"conditionsOfAccess","displaypublicsummary":"conditionsOfAccess","documents":"isBasedOn"},"url":"https://www.ncbi.nlm.nih.gov/gap","genre":"Generalist","conditionsOfAccess":"Varied","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.1181,"avg_augmented_required_ratio":0.0536,"avg_recommended_score_ratio":0.327,"avg_required_ratio":0.8331,"total_documents":2865,"required_fields":{"name":1.0,"description":1.0,"author":0.9522,"url":1.0,"measurementTechnique":0.7578,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.7986,"date":0.9997},"recommended_fields":{"dateCreated":0.9993,"dateModified":0.9997,"datePublished":0.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.059,"healthCondition":0.8538,"species":0.4855,"variableMeasured":0.0087,"citation":0.5756,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":0.4328,"license":0.7337,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.8586,"identifier":1.0,"usageInfo":0.9787,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.4873,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.4855,"infectiousAgent":0.059,"healthCondition":0.4897,"citation":0.5756,"topicCategory":0.8586},"sum_required_coverage":7.5083,"sum_recommended_coverage":8.9854,"binary_required_score":8,"binary_recommended_score":13,"binary_required_augmented":1,"binary_recommended_augmented":5,"percent_required_fields":0.8889,"percent_recommended_fields":0.619,"conditionsOfAccess":"Restricted"}}},"ncbi_geo":{"code":{"gsm_ncbi_geo":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_geo/gsm_uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_geo/gsm_uploader.py"},"gse_ncbi_geo":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_geo/gse_uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/ncbi_geo/gse_uploader.py"}},"stats":{"gsm_ncbi_geo":7977186,"gse_ncbi_geo":264383},"download_date":"2025-10-21T14:06:05.065000","version":"2025-10-06T23:04:37Z","upload_date":{"gsm_ncbi_geo":"2026-03-31T19:30:06.399000","gse_ncbi_geo":"2026-02-19T01:06:04.010000"},"sourceInfo":{"name":"NCBI GEO","abstract":"Gene Expression Omnibus (GEO) is an NIH supported repository that includes microarray and next-generation sequencing data for high-throughput functional genomics for most domains.","description":"GEO is a public functional genomics data repository supporting MIAME-compliant data submissions. Array- and sequence-based data are accepted. Tools are provided to help users query and download experiments and curated gene expression profiles.","schema":{"_id":"identifier","contributor(s)":"author","organization":"publisher","title":"name","organism":"species","experiment type":"measurementTechnique","summary":"description","submission date":"datePublished","last update date":"dateModified","citation(s)":"citation"},"url":"https://www.ncbi.nlm.nih.gov/geo/","identifier":"NCBI GEO","conditionsOfAccess":"Unknown","genre":"Generalist","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.1266,"avg_augmented_required_ratio":0.0325,"avg_recommended_score_ratio":0.14,"avg_required_ratio":0.9153,"required_fields":{"name":1.0,"description":1.0,"author":0.8403,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.4821,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.0636,"healthCondition":0.3966,"species":0.4683,"variableMeasured":0.0,"citation":0.7861,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.9369,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":8.32,"sum_recommended_coverage":5.65,"required_augmented_fields_coverage":{"funding":0.3,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.47,"infectiousAgent":0.06,"healthCondition":0.4,"citation":0.79,"topicCategory":0.94},"binary_required_score":9,"binary_recommended_score":8,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":1.0,"percent_recommended_fields":0.38,"conditionsOfAccess":"Unknown"}}},"dryad":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/dryad/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/dryad/uploader.py"},"stats":{"dryad":69163},"download_date":"2026-03-14T14:41:35.998000","version":"2026-03-14T14:41:11Z","upload_date":"2026-03-17T08:10:04.996000","sourceInfo":{"name":"Dryad Digital Repository","abstract":"Dryad Digital Repository is a GREI repository that includes most data types and domains.","description":"Dryad is an open source, community driven project that takes a unique approach to data publication and digital preservation. Dryad focuses on search, presentation, and discovery and delegates the responsibility for the data preservation function to the underlying repository with which it is integrated. Dryad aims to allow researchers to validate published findings, explore new analysis methodologies, re-purpose data for research questions unanticipated by the original authors, and perform synthetic studies such as formal meta-analyses.","schema":{"name":"name","description":"description","contentUrl":"contentUrl","identifier":"identifier, doi","keywords":"keywords","creator":"author","distribution":"distribution","temporalCoverage":"temporalCoverage","spatialCoverage":"spatialCoverage","citation":"citation","license":"license","datePublished":"datePublished","conditions":"healthCondition.name","outcomeNames":"variable_measured","digitalObjectId":"doi","studyMetadataDoi":"doi","extractedBriefSummary":"description","draftCreatedDate":"dateCreated","postedDate":"datePublished","updatedDate":"dateModified"},"url":"https://datadryad.org","identifier":"Dryad Digital Repository","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Monthly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0804,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.3786,"avg_required_ratio":0.8316,"total_documents":69163,"required_fields":{"name":1.0,"description":0.9998,"author":1.0,"url":1.0,"measurementTechnique":0.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.4696,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.0,"datePublished":1.0,"citedBy":0.0,"doi":1.0,"infectiousAgent":0.0,"healthCondition":0.0819,"species":0.7546,"variableMeasured":0.0,"citation":0.908,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":0.8227,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.2341,"temporalCoverage":1.0,"topicCategory":0.7804,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.7546,"infectiousAgent":0.0,"healthCondition":0.0814,"citation":0.0,"topicCategory":0.7803},"sum_required_coverage":7.4694,"sum_recommended_coverage":9.5817,"binary_required_score":8,"binary_recommended_score":12,"binary_required_augmented":0,"binary_recommended_augmented":3,"percent_required_fields":0.8889,"percent_recommended_fields":0.5714,"conditionsOfAccess":"Varied"}}},"flowrepository":{"sourceInfo":{"abstract":"Flow Repository is a repository that includes flow cytometry data.","description":"FlowRepository is a database of flow cytometry experiments where you can query and download data collected and annotated according to the MIFlowCyt standard. It is primarily used as a data deposition place for experimental findings published in peer-reviewed journals in the flow cytometry field.","identifier":"Flow Repository","name":"Flow Repository","schema":{"Repository ID":"identifier","Experiment Name":"name","Primary researcher":"author.name","PI/manager":"author.name","Uploaded by":"author.name","Experiment dates":"temporalCoverage.startDate,temporalCoverage.endDate","Dataset uploaded":"datePublished","Last updated":"dateModified","Keywords":"keywords","Manuscripts":"citation,funding","Organizations":"author.affiliation.name","Purpose":"description","Conclusion":"description","Comments":"description","Funding":"funding.description","Quality control":"description"},"url":"http://flowrepository.org/","conditionsOfAccess":"Open","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.0908,"avg_augmented_required_ratio":0.0105,"avg_recommended_score_ratio":0.3142,"avg_required_ratio":0.9313,"total_documents":2277,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":0.4058,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":1.0,"datePublished":1.0,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.1577,"healthCondition":0.2148,"species":0.1774,"variableMeasured":0.0,"citation":0.3303,"conditionsOfAccess":1.0,"isBasedOn":0.0,"keywords":0.6034,"license":1.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":1.0,"topicCategory":0.9763,"identifier":1.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.0957,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.1774,"infectiousAgent":0.1577,"healthCondition":0.2139,"citation":0.3303,"topicCategory":0.9763},"sum_required_coverage":8.4058,"sum_recommended_coverage":8.4599,"binary_required_score":9,"binary_recommended_score":12,"binary_required_augmented":1,"binary_recommended_augmented":5,"percent_required_fields":1.0,"percent_recommended_fields":0.5714,"conditionsOfAccess":"Open"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/flowrepository/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"77ab197","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/77ab197d75c16ac4d5c3834041a974030863a2bf/biothings-hub/files/nde-hub/hub/dataload/sources/flowrepository/uploader.py"},"stats":{"flowrepository":2277},"download_date":"2026-03-28T23:26:05.900000","version":"2026-03-28T23:26:05Z","upload_date":"2025-07-05T23:25:40.064000"},"dash":{"sourceInfo":{"abstract":"The Data and Specimen Hub (DASH) is an NICHD supported repository that includes clinical data and specimens.","description":"The NICHD Data and Specimen Hub(DASH) is a centralized resource that allows researchers to share and access de-identified data from studies funded by NICHD. DASH also serves as a portal for requesting biospecimens from selected DASH studies. DASH serves as a mechanism for NICHD-funded extramural and intramural investigators to share research data from studies in accordance with NIH Data Sharing Policies. Many of the NICHD-funded research studies also collected biospecimens that are stored in the NICHD Contracted Biorepository. To provide access to these biospecimens, DASH will store and make available to other investigators the biospecimen catalog for studies that have associated research data in DASH. By supporting data and biospecimen access through DASH, NICHD aims to accelerate scientific findings and improve human health.","identifier":"NICHD DASH","name":"NICHD Data and Specimen Hub (DASH)","schema":{"Study Name":"name","Study Abbreviation":"alternateName","citation":"citation.name","DOI":"citation.doi","Publication URLs":"citation.url","NICHD Division/Branch/Center":"funding.funder.name","Study Description":"description","Clinical Research Network Name":"author.name","Principal Investigator(s)":"author.name","Keywords":"keywords","Topic":"keywords","Requires IRB approval to obtain data":"conditionsOfAccess","Additional Approval Entity":"conditionsOfAccess","Study Type":"measurementTechnique.name","ClinicalTrials.gov URL":"mainEntityOfPage","StudyCollectionStartDate":"temporalCoverage.startDate","StudyCollectionEndDate":"temporalCoverage.endDate","approvalDate":"datePublished","Population Description":"description","descriptiveDocuments":"hasPart,isBasedOn","datasetTitle":"name","datasetDescription":"description","datasetFormat":"encodingFormat"},"url":"https://dash.nichd.nih.gov/","conditionsOfAccess":"Restricted","genre":"Generalist","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.151,"avg_augmented_required_ratio":0.0619,"avg_recommended_score_ratio":0.3098,"avg_required_ratio":1.0,"total_documents":12510,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":1.0,"funding":1.0,"date":1.0},"recommended_fields":{"dateCreated":0.0,"dateModified":0.2507,"datePublished":1.0,"citedBy":0.2476,"doi":0.0,"infectiousAgent":0.2317,"healthCondition":0.5892,"species":0.6735,"variableMeasured":0.0,"citation":0.9811,"conditionsOfAccess":1.0,"isBasedOn":1.0,"keywords":1.0,"license":0.0,"sdPublisher":0.0,"spatialCoverage":0.0,"temporalCoverage":0.9904,"topicCategory":0.9057,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.563,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.6735,"infectiousAgent":0.2317,"healthCondition":0.5892,"citation":0.7627,"topicCategory":0.9057},"sum_required_coverage":9.0,"sum_recommended_coverage":8.8699,"binary_required_score":9,"binary_recommended_score":12,"binary_required_augmented":1,"binary_recommended_augmented":5,"percent_required_fields":1.0,"percent_recommended_fields":0.5714,"conditionsOfAccess":"Varied"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/dash/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"aa221fa","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/aa221faa7268c68feecb8f37737e007a41e46e09/biothings-hub/files/nde-hub/hub/dataload/sources/dash/uploader.py"},"stats":{"dash":12510},"download_date":"2025-07-06T04:36:20.927000","version":"2026-03-15T03:00:04Z","upload_date":"2025-07-06T04:36:30.090000"},"covid_radx":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/covid_radx/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"8821698","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/88216988e41196119b097fd8ba71d89bce53ae95/biothings-hub/files/nde-hub/hub/dataload/sources/covid_radx/uploader.py"},"stats":{"covid_radx":178},"download_date":"2025-03-26T22:22:26.256000","version":"2025-03-26T22:21:24Z","upload_date":"2025-04-09T21:38:07.764000","sourceInfo":{"abstract":"COVID RADx Data Hub is a NIH supported IID repository that includes clinical data.","description":"The NIH Rapid Acceleration of Diagnostics Data Hub (RADx Data Hub) is a centralized data repository that provides access to analytic tools and de-identified COVID-19 data from the RADx Initiative. The RADx Data Hub supports scientific efforts to better understand COVID-19 and factors associated with disparities in morbidity and mortality in underserved and vulnerable populations, by allowing researchers to discover, access, and perform analyses of COVID-19 datasets in a cloud-enabled platform.","identifier":"RADx Data Hub","name":"COVID RADx Data Hub","schema":{"@version":"version","created_at":"dateCreated","ct_url":"isBasedOn.url","data_species":"species.name","dcc":"sdPublisher.name","description":"description","disease_specific_related_conditions":"healthCondition.name","grant_number":"funding.funder.identifier","institution_supporting_study_array":"funding.funder.name","multi_center_sites":"author","pi_name":"author","release_date":"datePublished","publication_url":"citation, funding","source_array":"measurementTechnique.name","types_array":"measurementTechnique.name","data_general_types_array":"measurementTechnique.name","study_id":"url","population_focus_array":"keywords","topics_array":"keywords","study_website_url":"mainEntityOfPage","start_date":"temporalCoverage.startDate","end_date":"temporalCoverage.endDate","subject_array":"variablesMeasured","title":"name","updated_at":"dateModified","general_research_group":"usageInfo","health_biomed_group":"usageInfo"},"url":"https://radxdatahub.nih.gov/","conditionsOfAccess":"Unknown","genre":"IID","schedule":"Manual","metadata_completeness":{"avg_augmented_recommended_ratio":0.0785,"avg_augmented_required_ratio":0.0538,"avg_recommended_score_ratio":0.6954,"avg_required_ratio":0.89,"total_documents":178,"required_fields":{"name":1.0,"description":1.0,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":1.0,"date":1.0},"recommended_fields":{"dateCreated":1.0,"dateModified":0.9888,"datePublished":1.0,"citedBy":0.0,"doi":0.9438,"infectiousAgent":1.0,"healthCondition":1.0,"species":1.0,"variableMeasured":0.9775,"citation":0.5112,"conditionsOfAccess":1.0,"isBasedOn":0.2022,"keywords":1.0,"license":1.0,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":1.0,"topicCategory":0.2809,"identifier":1.0,"usageInfo":0.9213,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.4888,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0,"infectiousAgent":0.3596,"healthCondition":0.4551,"citation":0.5112,"topicCategory":0.2809},"sum_required_coverage":8.0,"sum_recommended_coverage":15.8257,"binary_required_score":8,"binary_recommended_score":18,"binary_required_augmented":1,"binary_recommended_augmented":4,"percent_required_fields":0.8889,"percent_recommended_fields":0.8571,"conditionsOfAccess":"Restricted"}}},"vdj":{"sourceInfo":{"abstract":"VDJServer is a NIAID supported repository that includes immune repertoire sequencing data.","description":"VDJServer is a free, scalable resource for performing immune repertoire analysis and sharing data. VDJServer Community Data Portal is part of the AIRR Data Commons. Funded by a National Institute of Allergy and Infectious Diseases research grant (#1R01A1097403), the VDJServer project is led by The University of Texas Southwestern (UTSW) Medical Center in collaboration with the J. Craig Venter Institute and Yale University. The Texas Advanced Computing Center (TACC) at The University of Texas at Austin leads the cyberinfrastructure implementation, including the high performance computing (HPC) systems, storage, and software solutions.","identifier":"VDJServer","name":"VDJServer","schema":{"study.study_id":"identifier","study.study_title":"name","study.study_type.label":"measurementTechnique.name","study.study_type.id":"measurementTechnique.identifier","study.study_description":"description","study.inclusion_exclusion_criteria":"description","study.lab_name":"author.name","study.lab_address":"author.affiliation.name","study.submitted_by":"author.name","study.collected_by":"author.name","study.grants":"description","study.pub_ids":"citation, pmids","study.adc_publish_date":"datePublished","study.adc_update_date":"dateModified","study.publisher":"sdPublisher.name","download_info.archive_file":"distribution.contentUrl","download_info.download_url":"distribution.contentUrl","download_info.file_size":"distribution.contentSize","data_processing.data_processing_files":"distribution.contentUrl","sample.anatomic_site":"keywords","sample.disease_state_sample":"keywords","sample.template_class":"keywords","sample.cell_subset.label":"keywords","sample.tissue.label":"keywords","sample.cell_subset.id":"keywords","sample.tissue.id":"keywords","sample.cell_species.label":"species.name","subject.diagnosis.disease_stage":"keywords","subject.species.id":"species.identifier","subject.species.label":"species.name","subject.diagnosis.disease_diagnosis.label":"healthCondition.name","subject.diagnosis.disease_diagnosis.id":"healthCondition.identifier","assigned based on discussion":"license, usageInfo, conditionsOfAccess, variableMeasured"},"conditionsOfAccess":"Open","url":"https://vdj-staging.tacc.utexas.edu/community/","schedule":"Weekly","metadata_completeness":{"avg_augmented_recommended_ratio":0.1009,"avg_augmented_required_ratio":0.0,"avg_recommended_score_ratio":0.1072,"avg_required_ratio":0.7353,"required_fields":{"name":1.0,"description":1.0,"author":0.9844,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":0.0,"funding":0.0,"date":0.6094},"recommended_fields":{"dateCreated":0.0,"dateModified":0.6094,"datePublished":0.6094,"citedBy":0.0,"doi":0.0,"infectiousAgent":0.4062,"healthCondition":0.5781,"species":0.2188,"variableMeasured":0.0,"citation":0.0469,"conditionsOfAccess":0.0,"isBasedOn":0.0,"keywords":0.0,"license":0.0,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":0.8594,"identifier":0.0,"usageInfo":0.0,"interactionStatistic":0.0},"sum_required_coverage":6.59,"sum_recommended_coverage":4.33,"required_augmented_fields_coverage":{"funding":0.0,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.22,"infectiousAgent":0.41,"healthCondition":0.58,"citation":0.0,"topicCategory":0.86},"binary_required_score":7,"binary_recommended_score":8,"binary_required_augmented":0,"binary_recommended_augmented":0,"percent_required_fields":0.78,"percent_recommended_fields":0.38,"conditionsOfAccess":"Unknown"}},"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/vdj/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"f122a92","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/f122a922dc628eb78f555588b310c356be573079/biothings-hub/files/nde-hub/hub/dataload/sources/vdj/uploader.py"},"stats":{"vdj":4403},"download_date":"2026-03-29T03:23:56.993000","version":"2026-03-29T03:23:45Z","upload_date":"2026-03-29T03:24:00.070000"},"proteomexchange":{"code":{"file":"biothings-hub/files/nde-hub/hub/dataload/sources/proteomexchange/uploader.py","repo":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers.git","commit":"7cfdc98","branch":"main","url":"git@github.com:NIAID-Data-Ecosystem/nde-crawlers/tree/7cfdc98f0188559304ae036d92987bd883310a9b/biothings-hub/files/nde-hub/hub/dataload/sources/proteomexchange/uploader.py"},"stats":{"proteomexchange":51318},"download_date":"2026-04-01T09:20:18.751000","version":"2026-04-01T09:19:56Z","upload_date":"2026-04-01T09:20:20.087000","sourceInfo":{"abstract":"Proteome Xchange is a consortia supported generalist repository that includes proteomic data.","description":"The ProteomeXchange Consortium was established to provide globally coordinated standard data submission and dissemination pipelines involving the main proteomics repositories, and to encourage open data policies in the field. ProteomeXchange fully supports both MS/MS proteomics and SRM data submission. Submissions of other types of proteomics data is also possible using the Partial Submission mechanism.","identifier":"ProteomeXchange","name":"Proteome Xchange","schema":{"identifiers":"identifier","identifiers_doi":"doi","title":"name","datasetHistory":"name","description":"description","contacts":"author.name","contacts_affiliation":"author.affiliation.name","species":"species.name","species_taxid":"species.identifier","instruments":"sample.instrument.name","keywords":"keywords","datasetHistory_keywords":"keywords","publications":"citation","datasetHistory_publication":"citation","datasetSummary":"datePublished","datasetHistory_identifierDate":"dateCreated","datasetHistory_revisionDate":"dateModified","datasetHistory_submissionDate":"dateModified","datasetFiles":"distribution","datasetOrigins":"isRelatedTo","fullDatasetLinks":"sdPublisher.url","datasetSummary_hostingRepository":"sdPublisher.name"},"metadata_completeness":{"avg_augmented_recommended_ratio":0.0391,"avg_augmented_required_ratio":0.0156,"avg_recommended_score_ratio":0.5121,"avg_required_ratio":0.884,"total_documents":50761,"required_fields":{"name":1.0,"description":0.9996,"author":1.0,"url":1.0,"measurementTechnique":1.0,"includedInDataCatalog":1.0,"distribution":0.8685,"funding":0.1775,"date":1.0},"recommended_fields":{"dateCreated":0.0011,"dateModified":1.0,"datePublished":0.9999,"citedBy":0.0,"doi":0.1403,"infectiousAgent":0.2293,"healthCondition":0.3373,"species":0.8232,"variableMeasured":0.0,"citation":0.6034,"conditionsOfAccess":1.0,"isBasedOn":0.0123,"keywords":0.9972,"license":1.0,"sdPublisher":1.0,"spatialCoverage":0.0,"temporalCoverage":0.0,"topicCategory":1.0,"identifier":1.0,"usageInfo":1.0,"interactionStatistic":0.0},"required_augmented_fields_coverage":{"funding":0.1422,"measurementTechnique":0.0},"recommended_augmented_fields_coverage":{"species":0.0509,"infectiousAgent":0.0493,"healthCondition":0.3363,"citation":0.3568,"topicCategory":0.0},"sum_required_coverage":8.0456,"sum_recommended_coverage":11.144,"binary_required_score":9,"binary_recommended_score":16,"binary_required_augmented":1,"binary_recommended_augmented":4,"percent_required_fields":1.0,"percent_recommended_fields":0.7619,"conditionsOfAccess":"Open"}}},"amoebadb":{"sourceInfo":{"name":"AmoebaDB","abstract":"AmoebaDB is a NIAID supported IID repository that includes genomic data.","description":"AmoebaDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK).These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://amoebadb.org/amoeba/app","identifier":"AmoebaDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"cryptodb":{"sourceInfo":{"name":"CryptoDB","abstract":"CryptoDB is a NIAID supported IID repository that includes genomic data.","description":"CryptoDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://cryptodb.org/cryptodb/app","identifier":"CryptoDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"giardiadb":{"sourceInfo":{"name":"GiardiaDB","abstract":"GiardiaDB is a NIAID supported IID repository that includes genomic data.","description":"GiardiaDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://giardiadb.org/giardiadb/app","identifier":"GiardiaDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"hostdb":{"sourceInfo":{"name":"HostDB","abstract":"HostDB is a NIAID supported IID repository that includes genomic data.","description":"HostDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://hostdb.org/hostdb/app","identifier":"HostDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"plasmodb":{"sourceInfo":{"name":"PlasmoDB","abstract":"PlasmoDB is a NIAID supported IID repository that includes genomic data.","description":"PlasmoDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://plasmodb.org/plasmo/app","identifier":"PlasmoDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"vectorbase":{"sourceInfo":{"name":"VectorBase","abstract":"VectorBase is a NIAID supported IID repository that includes genomic data.","description":"VectorBase is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://vectorbase.org/vectorbase/app","identifier":"VectorBase","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"fungidb":{"sourceInfo":{"name":"FungiDB","abstract":"FungiDB is a NIAID supported IID repository that includes genomic data.","description":"FungiDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://fungidb.org/fungidb/app","identifier":"FungiDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"microsporidiadb":{"sourceInfo":{"name":"MicrosporidiaDB","abstract":"MicrosporidiaDB is a NIAID supported IID repository that includes genomic data.","description":"MicrosporidiaDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://microsporidiadb.org/micro/app","identifier":"MicrosporidiaDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"toxodb":{"sourceInfo":{"name":"ToxoDB","abstract":"ToxoDB is a NIAID supported IID repository that includes genomic data.","description":"ToxoDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://toxodb.org/toxo/app","identifier":"ToxoDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"trichdb":{"sourceInfo":{"name":"TrichDB","abstract":"TrichDB is a NIAID supported IID repository that includes genomic data.","description":"TrichDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://trichdb.org/trichdb/app","identifier":"TrichDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"tritrypdb":{"sourceInfo":{"name":"TriTrypDB","abstract":"TriTrypDB is a NIAID supported IID repository that includes genomic data.","description":"TriTrypDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://tritrypdb.org/tritrypdb/app","identifier":"TriTrypDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"},"piroplasmadb":{"sourceInfo":{"name":"PiroplasmaDB","abstract":"PiroplasmaDB is a NIAID supported IID repository that includes genomic data.","description":"PiroplasmaDB is a component website of the Eukaryotic Pathogen, Vector and Host Informatics Resource (VEuPathDB) and is constructed using the same infrastructure, data analysis, and loading procedures. VEuPathDB is is one of two bioinformatics Resource Centers (BRCs) funded by the US National Institute of Allergy and Infectious Diseases (NIAID), with additional support from the Wellcome Trust (UK). These resources stem from support initially provided for the Plasmodium Genome Database by the Burroughs Wellcome Fund (2000-2) and a research grant from NIAID (2002-6). The BRC program was initiated in 2004 to provide public access to computational platforms and analysis tools enabling collection, management, integration and mining of genomic information and other large-scale datasets relevant to infectious disease pathogens including their interaction with mammalian hosts and invertebrate vectors of disease.","schema":{"id":"identifer","displayName":"name","contact_name":"author","summary":"description","type":"measurementTechnique","sdPublisher":"project_id","short_attribution":"creditText","release_policy":"conditionOfAccess","version":"dateModified","author":"affiliation","GenomeHistory":"dateUpdated","Version":"datePublished","organism":"species","HyperLinks":"distribution","gene_count":"variableMeasured","gene_type":"GeneTypeCounts"},"url":"https://piroplasmadb.org/piro/app","identifier":"PiroplasmaDB","conditionsOfAccess":"Closed","genre":"IID","parentCollection":{"id":"veupathdb"},"schedule":"Weekly"},"version":"2026-03-28T23:00:13Z"}},"stats":{"total":69953858}}