{"@type": "dcat:Dataset", "accessLevel": "public", "accrualPeriodicity": "R/P1Y", "bureauCode": ["006:55"], "contactPoint": {"fn": "George Awad", "hasEmail": "mailto:george.awad@nist.gov"}, "description": "This dataset contains short videos (ranging from 3 seconds to 10 seconds) from the TRECVID VTT task from 2016 to 2024. There are 73,893 videos with captions. Each video has between 2 and 5 captions, which have been written by dedicated annotators hired by NIST.", "distribution": [{"accessURL": "https://doi.org/10.18434/mds2-2545", "title": "DOI Access for TV_VTT (TrecVid Video-To-Text) Dataset"}, {"accessURL": "https://ir.nist.gov/tv_vtt_data/", "description": "This dataset contains short videos (ranging from 3 seconds to 10 seconds) from the TRECVID VTT task from 2016 to 2021. There are 10,862 videos with captions. Each video has between 2 and 5 captions, which have been written by dedicated annotators hired by NIST.", "format": "videos are in mp4 and captions are in plain text.", "title": "TV_VTT"}, {"accessURL": "https://ir.nist.gov/tv_vtt_data/Readme.txt", "description": "A high-level readme file explaining how the dataset (videos and captions) is organized.", "format": "txt", "title": "Readme"}, {"description": "Please submit the following data agreement form to access the TV_VTT (video to text development dataset).", "downloadURL": "https://data.nist.gov/od/ds/mds2-2545/V3C_VTT_Org.Form.txt", "format": "text file", "mediaType": "text/plain", "title": "data agreement form"}], "identifier": "ark:/88434/mds2-2545", "issued": "2022-02-14", "keyword": ["image captioning", "video captioning", "video retrieval", "video to text"], "landingPage": "https://data.nist.gov/od/id/mds2-2545", "language": ["en"], "license": "https://www.nist.gov/open/license", "modified": "2025-01-06 00:00:00", "programCode": ["006:045"], "publisher": {"@type": "org:Organization", "name": "National Institute of Standards and Technology"}, "theme": ["Information Technology:Data and informatics"], 
"title": "TV_VTT (TrecVid Video-To-Text) Dataset"}