{
  "_schema": "https://data.nist.gov/od/dm/nerdm-schema/v0.7#",
  "@context": [
    "https://data.nist.gov/od/dm/nerdm-pub-context.jsonld",
    {
      "@base": "ark:/88434/mds2-2545"
    }
  ],
  "@type": [
    "nrdp:PublicDataResource",
    "dcat:Dataset"
  ],
  "_extensionSchemas": [
    "https://data.nist.gov/od/dm/nerdm-schema/pub/v0.7#/definitions/PublicDataResource"
  ],
  "@id": "ark:/88434/mds2-2545",
  "ediid": "ark:/88434/mds2-2545",
  "version": "1.1.1",
  "doi": "doi:10.18434/mds2-2545",
  "title": "TV_VTT (TrecVid Video-To-Text) Dataset",
  "contactPoint": {
    "fn": "George Awad",
    "hasEmail": "mailto:george.awad@nist.gov"
  },
  "modified": "2025-01-06 00:00:00",
  "status": "available",
  "landingPage": "https://data.nist.gov/od/id/mds2-2545",
  "description": [
    "This dataset contains short videos (ranging from 3 seconds to 10 seconds) from the TRECVID VTT task from 2016 to 2024. There are 73,893 videos with captions. Each video has between 2 and 5 captions, which have been written by dedicated annotators hired by NIST."
  ],
  "keyword": [
    "video captioning",
    "video retrieval",
    "video to text",
    "image captioning"
  ],
  "theme": [
    "Information Technology: Data and informatics"
  ],
  "topic": [
    {
      "@type": "Concept",
      "scheme": "https://data.nist.gov/od/dm/nist-themes/v1.1",
      "tag": "Information Technology: Data and informatics"
    }
  ],
  "accessLevel": "public",
  "license": "https://www.nist.gov/open/license",
  "components": [
    {
      "accessURL": "https://ir.nist.gov/tv_vtt_data/",
      "format": {
        "description": "Videos are in MP4 format and captions are in plain text."
      },
      "description": "This dataset contains short videos (ranging from 3 seconds to 10 seconds) from the TRECVID VTT task from 2016 to 2024. There are 73,893 videos with captions. Each video has between 2 and 5 captions, which have been written by dedicated annotators hired by NIST.",
      "title": "TV_VTT",
      "@type": [
        "nrdp:AccessPage",
        "dcat:Distribution"
      ],
      "@id": "#tv_vtt_data/",
      "_extensionSchemas": [
        "https://data.nist.gov/od/dm/nerdm-schema/pub/v0.7#/definitions/AccessPage"
      ]
    },
    {
      "accessURL": "https://ir.nist.gov/tv_vtt_data/Readme.txt",
      "format": {
        "description": "txt"
      },
      "description": "A high-level readme file explaining how the dataset (videos and captions) is organized.",
      "title": "Readme",
      "@type": [
        "nrdp:AccessPage",
        "dcat:Distribution"
      ],
      "@id": "#tv_vtt_data/Readme.txt",
      "_extensionSchemas": [
        "https://data.nist.gov/od/dm/nerdm-schema/pub/v0.7#/definitions/AccessPage"
      ]
    },
    {
      "accessURL": "https://doi.org/10.18434/mds2-2545",
      "title": "DOI Access for TV_VTT (TrecVid Video-To-Text) Dataset",
      "@type": [
        "nrd:Hidden",
        "dcat:Distribution"
      ],
      "@id": "#doi:10.18434/mds2-2545"
    },
    {
      "@id": "cmps/V3C_VTT_Org.Form.txt",
      "@type": [
        "nrdp:DataFile",
        "nrdp:DownloadableFile",
        "dcat:Distribution"
      ],
      "_extensionSchemas": [
        "https://data.nist.gov/od/dm/nerdm-schema/pub/v0.7#/definitions/DataFile"
      ],
      "filepath": "V3C_VTT_Org.Form.txt",
      "downloadURL": "https://data.nist.gov/od/ds/mds2-2545/V3C_VTT_Org.Form.txt",
      "mediaType": "text/plain",
      "format": {
        "description": "text file"
      },
      "description": "Please submit the following data agreement form to access the TV_VTT (video to text development dataset).",
      "title": "data agreement form",
      "size": 3430,
      "checksum": {
        "hash": "33dce25e823f089345bcb049e80bd32d78e9ef903c1e017a775474b9dccfe319",
        "algorithm": {
          "tag": "sha256",
          "@type": "Thing"
        }
      }
    }
  ],
  "publisher": {
    "name": "National Institute of Standards and Technology",
    "@type": "org:Organization"
  },
  "language": [
    "en"
  ],
  "bureauCode": [
    "006:55"
  ],
  "programCode": [
    "006:052"
  ],
  "annotated": "2025-01-06T23:15:36.402416",
  "revised": "2023-01-27T21:49:04.040824",
  "issued": "2022-02-14T17:03:57",
  "firstIssued": "2022-02-14T22:03:54.112389",
  "releaseHistory": {
    "@id": "ark:/88434/mds2-2545.rel",
    "@type": [
      "nrdr:ReleaseHistory"
    ],
    "hasRelease": [
      {
        "version": "1.0.0",
        "issued": "2021-10-01 00:00:00",
        "@id": "ark:/88434/mds2-2545/pdr:v/1.0.0",
        "location": "https://data.nist.gov/od/id/ark:/88434/mds2-2545/pdr:v/1.0.0",
        "description": "initial release"
      },
      {
        "version": "1.0.1",
        "issued": "2021-10-01 00:00:00",
        "@id": "ark:/88434/mds2-2545/pdr:v/1.0.1",
        "location": "https://data.nist.gov/od/id/ark:/88434/mds2-2545/pdr:v/1.0.1",
        "description": "metadata update"
      },
      {
        "version": "1.1.0",
        "issued": "2021-10-01 00:00:00",
        "@id": "ark:/88434/mds2-2545/pdr:v/1.1.0",
        "location": "https://data.nist.gov/od/id/ark:/88434/mds2-2545/pdr:v/1.1.0",
        "description": "data update"
      },
      {
        "version": "1.1.1",
        "issued": "2025-01-06 00:00:00",
        "@id": "ark:/88434/mds2-2545/pdr:v/1.1.1",
        "location": "https://data.nist.gov/od/id/ark:/88434/mds2-2545/pdr:v/1.1.1",
        "description": "metadata update"
      }
    ]
  }
}