{"@type": "dcat:Dataset", "accessLevel": "public", "accrualPeriodicity": "irregular", "bureauCode": ["006:55"], "contactPoint": {"fn": "Tyler Laird", "hasEmail": "mailto:tyler.laird@nist.gov"}, "description": "This repository contains the dataset used in the manuscript \"Inter-tool analysis of a NIST dataset for assessing baseline nucleic acid sequence screening\". NIST constructed the test dataset based on the current screening recommendations from HHS. The dataset is a FASTA-formatted file with blinded numerical sequence headers. The dataset was sent to sequence screening tool developers for initial testing and to obtain feedback about its utility for assessing baseline sequence screening. An additional metadata file provides the NIST-assigned label for each sequence, along with a more detailed description derived from the source database.", "distribution": [{"description": "A FASTA file of blinded sequences used as a test for assessing baseline sequence screening capabilities of several nucleic acid synthesis screening tools.", "downloadURL": "https://data.nist.gov/od/ds/mds2-3787/NIST_nucleic_acid_synthesis_screening_test_dataset.fasta", "format": "FASTA", "mediaType": "text/plain", "title": "NIST_nucleic_acid_synthesis_screening_test_dataset"}, {"description": "A file with additional information for each sequence in the associated FASTA file.", "downloadURL": "https://data.nist.gov/od/ds/mds2-3787/NIST_nucleic_acid_syntheisis_screening_test_dataset_metadata.tsv", "mediaType": "text/tab-separated-values", "title": "NIST_nucleic_acid_syntheisis_screening_test_dataset_metadata"}, {"description": "A README file pertaining to the NIST test dataset for assessing baseline nucleic acid sequence screening.", "downloadURL": "https://data.nist.gov/od/ds/mds2-3787/README.md", "mediaType": "text/markdown", "title": "README"}], "identifier": "ark:/88434/mds2-3787", "issued": "2025-05-21", "keyword": ["Nucleic Acid Synthesis", "Sequence Screening", "DNA", "Biosecurity"], 
"landingPage": "https://data.nist.gov/od/id/mds2-3787", "language": ["en"], "license": "https://www.nist.gov/open/license", "modified": "2024-08-09 00:00:00", "programCode": ["006:045"], "publisher": {"@type": "org:Organization", "name": "National Institute of Standards and Technology"}, "theme": ["Bioscience:Engineering/synthetic biology", "Public Safety:Chemical/Biological/Radiological/Nuclear/Explosives (CBRNE)", "Bioscience:Biomaterials"], "title": "NIST test dataset for assessing baseline nucleic acid sequence screening"}