@prefix schema: <https://schema.org/> .
@prefix af: <https://anchorfact.org/ns#> .

# Article record: types the resource as schema:TechArticle and attaches its
# headline, its public URL, and AnchorFact (af:) publication/confidence metadata.
# The subject IRI (under /kb/ai/) is the graph identifier; schema:url points at a
# different path (under /ai/, with a trailing slash).
# NOTE(review): af:confidenceScore is written as a plain string literal ("0.685"),
# not a typed numeric literal, so numeric comparison in a query would need a
# cast -- confirm this is what consumers of the af: vocabulary expect.
<https://anchorfact.org/kb/ai/llm-evaluation-tau-bench-tool-agent-benchmarks>
  a schema:TechArticle ;
  schema:headline "LLM Evaluation Tau-bench Tool-Agent Benchmarks" ;
  schema:url <https://anchorfact.org/ai/llm-evaluation-tau-bench-tool-agent-benchmarks/> ;
  af:status "public" ;
  af:confidence "medium" ;
  af:confidenceScore "0.685" ;
  af:confidenceBasis "verified_sources" ;
  af:generationMethod "ai_structured" .

# Citation statement on the article subject: cites the arXiv abstract page
# 2406.12045 and records af:sourceTier "C" in the same statement group.
# NOTE(review): af:sourceTier is asserted on the article, not on the cited IRI.
# After parsing, the tier is not linked to this particular citation and cannot be
# told apart from any other af:sourceTier value on the same subject -- confirm
# whether consumers rely on this textual grouping or need a per-citation node.
<https://anchorfact.org/kb/ai/llm-evaluation-tau-bench-tool-agent-benchmarks>
  schema:citation <https://arxiv.org/abs/2406.12045> ;
  af:sourceTier "C" .

# Citation statement on the article subject: cites the sierra-research/tau-bench
# GitHub repository and records af:sourceTier "B" in the same statement group.
# NOTE(review): af:sourceTier is asserted on the article, not on the cited IRI.
# After parsing, the tier is not linked to this particular citation and cannot be
# told apart from any other af:sourceTier value on the same subject -- confirm
# whether consumers rely on this textual grouping or need a per-citation node.
<https://anchorfact.org/kb/ai/llm-evaluation-tau-bench-tool-agent-benchmarks>
  schema:citation <https://github.com/sierra-research/tau-bench> ;
  af:sourceTier "B" .