{
  "apiVersion": "v1",
  "methodology": "https://sourcescore.org/methodology/",
  "canonical": "https://sourcescore.org/claims/e942c93d70a4dab2/",
  "claim": {
    "vertical": "ai-ml",
    "subject": "Byte-Pair Encoding (BPE) for Neural Machine Translation",
    "predicate": "introduced_in_paper",
    "object": "Neural Machine Translation of Rare Words with Subword Units (Sennrich et al., 2015)",
    "confidence": 1,
    "sources": [
      {
        "url": "https://arxiv.org/abs/1508.07909",
        "title": "Neural Machine Translation of Rare Words with Subword Units",
        "publisher": "arXiv (Sennrich, Haddow, Birch)",
        "publishedDate": "2015-08-31",
        "accessedDate": "2026-05-16",
        "type": "preprint",
        "excerpt": "We introduce a simpler and more effective approach, making the NMT model capable of open-vocabulary translation by encoding rare and unknown words as sequences of subword units."
      },
      {
        "url": "https://aclanthology.org/P16-1162/",
        "title": "Neural Machine Translation of Rare Words with Subword Units (ACL 2016)",
        "publisher": "Association for Computational Linguistics",
        "publishedDate": "2016-08-07",
        "accessedDate": "2026-05-16",
        "type": "peer-reviewed"
      }
    ],
    "publishedAt": "2026-05-16T00:00:00Z",
    "lastVerified": "2026-05-16",
    "methodologyVersion": "veritas-v0.1",
    "tags": [
      "bpe",
      "tokenization",
      "foundational",
      "sennrich",
      "2015",
      "acl",
      "nmt"
    ],
    "id": "e942c93d70a4dab2",
    "statement": "Byte-Pair Encoding (BPE) for Neural Machine Translation introduced in paper: Neural Machine Translation of Rare Words with Subword Units (Sennrich et al., 2015)."
  },
  "signature": {
    "algorithm": "HMAC-SHA256",
    "signedBy": "did:web:sourcescore.org",
    "signedAt": "2026-05-16T00:00:00.000Z",
    "signature": "f5a009459900288874d41e8ee2a99e6965431dbf4f66fce90d079bf69a8825fb"
  },
  "citedAs": "Byte-Pair Encoding (BPE) for Neural Machine Translation introduced in paper: Neural Machine Translation of Rare Words with Subword Units (Sennrich et al., 2015). — SourceScore Claim e942c93d70a4dab2 (verified 2026-05-16, signed f5a00945…). https://sourcescore.org/claims/e942c93d70a4dab2/"
}