@prefix schema: <https://schema.org/> .
@prefix af: <https://anchorfact.org/ns#> .

# Article-level record for the RLHF knowledge-base entry: type, public identity,
# publication state, and confidence metadata.
<https://anchorfact.org/kb/ai/rlhf> a schema:TechArticle ;
  # Public identity of the article.
  schema:url <https://anchorfact.org/ai/rlhf/> ;
  schema:headline "Reinforcement Learning from Human Feedback (RLHF)" ;
  # Publication state and how the entry was produced.
  af:generationMethod "ai_structured" ;
  af:status "public" ;
  # Confidence metadata.
  # NOTE(review): confidenceScore is a plain string literal (no numeric datatype
  # such as xsd:decimal) — confirm consumers expect a string before changing it.
  af:confidenceBasis "verified_sources" ;
  af:confidenceScore "0.855" ;
  af:confidence "medium" .

# Citation: arXiv:1706.03741 (believed to be Christiano et al., "Deep Reinforcement
# Learning from Human Preferences" — verify).
# NOTE(review): af:sourceTier is asserted on the article itself, not on the cited
# work. The same tier triple is repeated for the other citations in this file, and
# identical triples collapse to one in the parsed graph, so the per-citation
# pairing shown here is not recoverable by an RDF consumer — confirm the intended model.
<https://anchorfact.org/kb/ai/rlhf> af:sourceTier "S" ;
  schema:citation <https://arxiv.org/abs/1706.03741> .

# Citation: arXiv:2203.02155 (believed to be Ouyang et al., "Training language
# models to follow instructions with human feedback" — verify).
# NOTE(review): af:sourceTier is asserted on the article itself, not on the cited
# work. The same tier triple is repeated for the other citations in this file, and
# identical triples collapse to one in the parsed graph, so the per-citation
# pairing shown here is not recoverable by an RDF consumer — confirm the intended model.
<https://anchorfact.org/kb/ai/rlhf> af:sourceTier "S" ;
  schema:citation <https://arxiv.org/abs/2203.02155> .

# Citation: arXiv:2305.18290 (believed to be Rafailov et al., "Direct Preference
# Optimization" — verify).
# NOTE(review): af:sourceTier is asserted on the article itself, not on the cited
# work. The same tier triple is repeated for the other citations in this file, and
# identical triples collapse to one in the parsed graph, so the per-citation
# pairing shown here is not recoverable by an RDF consumer — confirm the intended model.
<https://anchorfact.org/kb/ai/rlhf> af:sourceTier "S" ;
  schema:citation <https://arxiv.org/abs/2305.18290> .