{
  "apiVersion": "v1",
  "methodology": "https://sourcescore.org/methodology/",
  "canonical": "https://sourcescore.org/claims/5da8f8dffc038b8e/",
  "claim": {
    "vertical": "ai-ml",
    "subject": "InstructGPT methodology",
    "predicate": "introduced_in_paper",
    "object": "Training language models to follow instructions with human feedback (Ouyang et al., 2022)",
    "confidence": 1,
    "sources": [
      {
        "url": "https://arxiv.org/abs/2203.02155",
        "title": "Training language models to follow instructions with human feedback",
        "publisher": "arXiv (Ouyang et al., OpenAI)",
        "publishedDate": "2022-03-04",
        "accessedDate": "2026-05-16",
        "type": "preprint",
        "excerpt": "We show an avenue for aligning language models with user intent on a wide range of tasks by fine-tuning with human feedback. … The resulting InstructGPT models show improvements in truthfulness and reductions in toxic output generation while having minimal performance regressions on public NLP datasets."
      },
      {
        "url": "https://openai.com/research/instruction-following",
        "title": "Aligning language models to follow instructions",
        "publisher": "OpenAI",
        "publishedDate": "2022-01-27",
        "accessedDate": "2026-05-16",
        "type": "official-blog"
      }
    ],
    "publishedAt": "2026-05-16T00:00:00Z",
    "lastVerified": "2026-05-16",
    "methodologyVersion": "veritas-v0.1",
    "tags": [
      "instructgpt",
      "alignment",
      "openai",
      "2022",
      "ouyang",
      "rlhf"
    ],
    "id": "5da8f8dffc038b8e",
    "statement": "InstructGPT methodology introduced in paper: Training language models to follow instructions with human feedback (Ouyang et al., 2022)."
  },
  "signature": {
    "algorithm": "HMAC-SHA256",
    "signedBy": "did:web:sourcescore.org",
    "signedAt": "2026-05-16T00:00:00.000Z",
    "signature": "76b8d2a8b34d06a65a0cb02f0321d0a373c5c21bf511bce71cd2cb646d1e19bd"
  },
  "citedAs": "InstructGPT methodology introduced in paper: Training language models to follow instructions with human feedback (Ouyang et al., 2022). — SourceScore Claim 5da8f8dffc038b8e (verified 2026-05-16, signed 76b8d2a8…). https://sourcescore.org/claims/5da8f8dffc038b8e/"
}