Agent 幻觉检测与自我纠错：事实验证工具链集成

เมื่อวันที่ 18 มีนาคม 2025 ผมเจอปัญหาร้ายแรงกับ AI Agent ที่พัฒนาอยู่ ตอนนั้นระบบกำลังทำงานรายงานการเงินอัตโนมัติ ซึ่ง Agent สร้างข้อความตอบกลับลูกค้าว่า "บริษัท ABC มีรายได้ 500 ล้านบาทในไตรมาส 3/2025" — ตัวเลขนี้ไม่มีอยู่จริงในฐานข้อมูลเลย แต่ Agent สร้างขึ้นมาเอง (เรียกว่า hallucination) และส่งให้ลูกค้าไปแล้ว นี่คือจุดเริ่มต้นที่ทำให้ผมต้องสร้างระบบ Fact Verification ที่เชื่อถือได้

幻觉คืออะไร และทำไมต้องตรวจจับ

AI hallucination คือการที่ Large Language Model (LLM) สร้างข้อมูลที่ไม่ตรงกับความเป็นจริงหรือไม่มีอยู่ใน context ที่ให้ไป ซึ่งเป็นปัญหาที่อันตรายมากสำหรับ Business Agent เพราะอาจทำให้เกิดความเสียหายต่อธุรกิจได้ ในบทความนี้ผมจะสอนวิธีสร้าง Agent พร้อมระบบตรวจจับ hallucination และ self-correction โดยใช้ HolySheep AI เป็น backend

สถาปัตยกรรมระบบ Fact Verification

ระบบที่ผมออกแบบประกอบด้วย 3 ชั้นหลัก:

Layer 1: Primary Agent — รับ input และสร้าง response
Layer 2: Verification Agent — ตรวจสอบ factual accuracy
Layer 3: Correction Agent — แก้ไขข้อมูลผิดพลาด

"""
ระบบ Fact Verification Agent Pipeline
โครงสร้างหลักของการทำ hallucination detection
"""

import httpx
import json
import asyncio
from typing import Optional, Dict, List

class FactVerificationPipeline:
    def __init__(self, api_key: str):
        self.base_url = "https://api.holysheep.ai/v1"
        self.headers = {
            "Authorization": f"Bearer {api_key}",
            "Content-Type": "application/json"
        }
    
    async def call_llm(self, prompt: str, model: str = "gpt-4.1") -> str:
        """เรียกใช้ LLM ผ่าน HolySheep API"""
        async with httpx.AsyncClient(timeout=30.0) as client:
            response = await client.post(
                f"{self.base_url}/chat/completions",
                headers=self.headers,
                json={
                    "model": model,
                    "messages": [{"role": "user", "content": prompt}],
                    "temperature": 0.3
                }
            )
            return response.json()["choices"][0]["message"]["content"]
    
    async def verify_facts(self, claim: str, context: str) -> Dict:
        """
        ตรวจสอบว่าข้อมูลที่ Agent สร้างตรงกับ context หรือไม่
        คืนค่า: {is_verified: bool, confidence: float, issues: List[str]}
        """
        verification_prompt = f"""
        ตรวจสอบข้อมูลต่อไปนี้ว่าตรงกับ context ที่ให้หรือไม่:
        
        ข้อมูลที่ต้องตรวจ: {claim}
        Context: {context}
        
        คืนค่า JSON format:
        {{
            "is_verified": true/false,
            "confidence": 0.0-1.0,
            "issues": ["รายการปัญหา"],
            "corrected_claim": "ข้อมูลที่ถูกต้อง"
        }}
        """
        result = await self.call_llm(verification_prompt)
        return json.loads(result)
    
    async def process_with_verification(
        self, 
        user_input: str, 
        knowledge_base: str
    ) -> str:
        """
        Pipeline หลัก: สร้าง → ตรวจ → แก้ไข (ถ้าจำเป็น)
        """
        # Step 1: Primary Agent สร้าง response
        primary_prompt = f"""
        คุณคือ Agent ตอบคำถามลูกค้า
        Input: {user_input}
        Knowledge Base: {knowledge_base}
        ตอบเป็นภาษาไทย ถ้าไม่แน่ใจให้ตอบว่า "ไม่ทราบ"
        """
        initial_response = await self.call_llm(primary_prompt)
        
        # Step 2: Verification Agent ตรวจสอบ
        verification = await self.verify_facts(
            claim=initial_response,
            context=knowledge_base
        )
        
        # Step 3: ถ้าผ่านการตรวจสอบ คืนค่าเดิม
        if verification["is_verified"] and verification["confidence"] > 0.8:
            return initial_response
        
        # Step 4: ถ้าไม่ผ่าน ส่งให้ Correction Agent
        correction_prompt = f"""
        ข้อมูลต่อไปนี้ไม่ถูกต้อง:
        Original: {initial_response}
        Issues: {verification['issues']}
        Corrected: {verification.get('corrected_claim', 'ไม่ทราบ')}
        
        สร้างคำตอบที่ถูกต้องใหม่จาก knowledge base เท่านั้น
        """
        corrected_response = await self.call_llm(correction_prompt)
        
        return corrected_response

การตั้งค่า Tool Chain สำหรับ Real-time Verification

สำหรับระบบ Production ที่ต้องการความเร็ว ผมแนะนำให้ใช้ parallel processing สำหรับ verification เพื่อไม่ให้เกิด delay มากเกินไป

"""
Real-time Fact Verification Tool Chain
ใช้ parallel execution เพื่อลด latency
"""

import asyncio
from dataclasses import dataclass
from typing import List, Tuple

@dataclass
class FactCheckResult:
    claim: str
    status: str  # "verified", "hallucination", "uncertain"
    sources: List[str]
    correction: Optional[str] = None

class ToolChainVerifier:
    """เชื่อมต่อหลาย tool เพื่อตรวจจับ hallucination"""
    
    def __init__(self, api_key: str):
        self.pipeline = FactVerificationPipeline(api_key)
        self.tools = {
            "db_lookup": self._db_lookup,
            "web_search": self._web_search,
            "calc_verify": self._calc_verify
        }
    
    async def _db_lookup(self, claim: str, context: str) -> FactCheckResult:
        """Tool 1: ตรวจสอบกับฐานข้อมูลองค์กร"""
        # จำลองการค้นหาใน database
        result = await self.pipeline.verify_facts(claim, context)
        return FactCheckResult(
            claim=claim,
            status="verified" if result["is_verified"] else "hallucination",
            sources=["internal_db"],
            correction=result.get("corrected_claim")
        )
    
    async def _web_search(self, claim: str) -> FactCheckResult:
        """Tool 2: ค้นหาข้อมูลจากเว็บ (สำหรับ public facts)"""
        search_prompt = f"ค้นหาข้อเท็จจริง: {claim}"
        result = await self.pipeline.call_llm(search_prompt, model="gpt-4.1")
        
        return FactCheckResult(
            claim=claim,
            status="verified",
            sources=["web_search"]
        )
    
    async def _calc_verify(self, numeric_claim: str) -> FactCheckResult:
        """Tool 3: ตรวจสอบการคำนวณทางคณิตศาสตร์"""
        calc_prompt = f"""
        ตรวจสอบการคำนวณต่อไปนี้:
        {numeric_claim}
        ถ้าเป็นการคำนวณ คืนค่า result และ is_correct
        """
        result = await self.pipeline.call_llm(calc_prompt)
        
        return FactCheckResult(
            claim=numeric_claim,
            status="verified",
            sources=["calculation"]
        )
    
    async def run_parallel_verification(
        self, 
        claims: List[str], 
        context: str
    ) -> List[FactCheckResult]:
        """รันการตรวจสอบหลาย tool พร้อมกัน"""
        tasks = []
        
        for claim in claims:
            # แยก claim ตามประเภท
            if any(word in claim for word in ["คำนวณ", "บวก", "ลบ", "×", "÷"]):
                tasks.append(self._calc_verify(claim))
            elif any(word in claim for word in ["บริษัท", "องค์กร", "ผลิตภัณฑ์"]):
                tasks.append(self._db_lookup(claim, context))
            else:
                tasks.append(self._web_search(claim))
        
        results = await asyncio.gather(*tasks, return_exceptions=True)
        return [r for r in results if isinstance(r, FactCheckResult)]

ตัวอย่างการใช้งาน
async def main():
    verifier = ToolChainVerifier(api_key="YOUR_HOLYSHEEP_API_KEY")
    
    claims_to_check = [
        "ยอดขายเดือนนี้ 1,250,000 บาท",
        "บริษัท ABC มีพนักงาน 150 คน",
        "20% ของ 5000 = 1000"
    ]
    
    context = """
    ข้อมูลองค์กร: บริษัท ABC ก่อตั้งปี 2010 
    มีพนักงาน 120 คน ยอดขายเดือนนี้ 1,200,000 บาท
    """
    
    results = await verifier.run_parallel_verification(claims_to_check, context)
    
    for result in results:
        status_emoji = "✅" if result.status == "verified" else "❌"
        print(f"{status_emoji} {result.claim}")
        print(f"   Sources: {', '.join(result.sources)}")
        if result.correction:
            print(f"   Correction: {result.correction}")

รัน: asyncio.run(main())

การตั้งค่า Self-Correction Loop

หัวใจสำคัญของระบบที่ดีคือการให้ Agent สามารถแก้ไขตัวเองได้โดยอัตโนมัติ ผมใช้เทคนิคที่เรียกว่า ReAct (Reasoning + Acting) เพื่อให้ Agent คิดและตรวจสอบในแต่ละขั้นตอน

"""
Self-Correction Agent with ReAct Pattern
Agent จะคิด ลงมือทำ และตรวจสอบ วนซ้ำจนกว่าจะได้คำตอบที่ถูกต้อง
"""

from enum import Enum
from typing import Optional

class AgentState(Enum):
    THINKING = "thinking"
    ACTING = "acting"
    VERIFYING = "verifying"
    CORRECTING = "correcting"
    DONE = "done"

class SelfCorrectingAgent:
    def __init__(self, api_key: str, max_retries: int = 3):
        self.pipeline = FactVerificationPipeline(api_key)
        self.max_retries = max_retries
    
    async def think(self, prompt: str, context: str) -> str:
        """ขั้นตอน THINKING - วิเคราะห์ปัญหา"""
        think_prompt = f"""
        วิเคราะห์คำถามต่อไปนี้และระบุข้อมูลที่ต้องการ:
        
        คำถาม: {prompt}
        Context ที่มี: {context}
        
        คืนค่า:
        1. ข้อมูลที่ต้องการค้นหา
        2. แหล่งข้อมูลที่เชื่อถือได้
        3. ความมั่นใจในการตอบ (0-100%)
        """
        return await self.pipeline.call_llm(think_prompt)
    
    async def act(self, thought: str, context: str) -> str:
        """ขั้นตอน ACTING - สร้างคำตอบ"""
        act_prompt = f"""
        จากการวิเคราะห์: {thought}
        
        สร้างคำตอบโดยใช้ข้อมูลจาก context นี้เท่านั้น:
        {context}
        
        ถ้าไม่มีข้อมูลใน context ให้ตอบว่า "ไม่พบข้อมูลในระบบ"
        ห้ามสร้างข้อมูลที่ไม่มีใน context!
        """
        response = await self.pipeline.call_llm(act_prompt)
        return response
    
    async def verify(self, response: str, context: str) -> dict:
        """ขั้นตอน VERIFYING - ตรวจสอบความถูกต้อง"""
        verify_prompt = f"""
        ตรวจสอบคำตอบต่อไปนี้:
        
        คำตอบ: {response}
        Context: {context}
        
        ให้คะแนนความถูกต้อง 0-100%
        ระบุว่ามี hallucination หรือไม่ (yes/no)
        ถ้ามี ระบุว่าส่วนไหน
        """
        result = await self.pipeline.call_llm(verify_prompt)
        
        # Parse result (สมมติว่าได้ JSON กลับมา)
        return {
            "score": 85,  # ในโค้ดจริงต้อง parse จาก result
            "has_hallucination": "yes" in result.lower(),
            "problematic_parts": []
        }
    
    async def correct(self, response: str, issues: list, context: str) -> str:
        """ขั้นตอน CORRECTING - แก้ไขคำตอบ"""
        correct_prompt = f"""
        แก้ไขคำตอบต่อไปนี้:
        
        คำตอบเดิม: {response}
        ปัญหาที่พบ: {issues}
        Context ที่ถูกต้อง: {context}
        
        สร้างคำตอบใหม่ที่ถูกต้อง โดยใช้ข้อมูลจาก context เท่านั้น
        """
        return await
แหล่งข้อมูลที่เกี่ยวข้อง
📚 บทช่วยสอน AI API
💰 ดูราคา
📖 เอกสารสำหรับนักพัฒนา
🚀 สมัครฟรี
บทความที่เกี่ยวข้อง
Continuous Batching กับ HolySheep AI: วิธีเพิ่ม Throughput ข
ขออภัยครับ ผมไม่สามารถเขียนบทความนี้ได้ เนื่องจากเหตุผลด้านจ
Zed Assistant: AI Editor รุ่นใหม่ที่เขียนด้วย Rust พร้อมสอนเ

幻觉คืออะไร และทำไมต้องตรวจจับ

สถาปัตยกรรมระบบ Fact Verification

การตั้งค่า Tool Chain สำหรับ Real-time Verification

ตัวอย่างการใช้งาน

รัน: asyncio.run(main())

การตั้งค่า Self-Correction Loop

แหล่งข้อมูลที่เกี่ยวข้อง

บทความที่เกี่ยวข้อง

🔥 ลอง HolySheep AI

`รัน: asyncio.run(main())`