feat: 添加 AI Agent 对话测试工具 + 代码优化
主要变更: - 新增 tests/test_ai_chat.py: AI Agent 对话测试工具 - 优化 core/pydantic_ai_agent.py 和 db/chat_log_db.py - 清理归档文件,更新文档 Made-with: Cursor
This commit is contained in:
313
tests/test_ai_chat.py
Normal file
313
tests/test_ai_chat.py
Normal file
@@ -0,0 +1,313 @@
|
||||
"""
|
||||
AI Agent 对话测试脚本
|
||||
从数据库加载聊天记录,测试 AI 回复效果
|
||||
"""
|
||||
import sqlite3
|
||||
import asyncio
|
||||
from datetime import datetime
|
||||
|
||||
# 颜色代码
|
||||
COLORS = {
|
||||
'header': '\033[95m\033[1m',
|
||||
'customer': '\033[94m',
|
||||
'agent': '\033[92m',
|
||||
'system': '\033[90m',
|
||||
'price': '\033[93m',
|
||||
'error': '\033[91m',
|
||||
'cyan': '\033[96m',
|
||||
'reset': '\033[0m',
|
||||
}
|
||||
|
||||
def cprint(text, color='reset'):
|
||||
print(f"{COLORS.get(color, '')}{text}{COLORS['reset']}")
|
||||
|
||||
def check_database():
|
||||
"""检查数据库内容"""
|
||||
db_path = 'db/chat_log_db/chats.db'
|
||||
try:
|
||||
conn = sqlite3.connect(db_path)
|
||||
cursor = conn.execute("SELECT COUNT(*) FROM chat_logs")
|
||||
count = cursor.fetchone()[0]
|
||||
|
||||
if count == 0:
|
||||
cprint(f"\n✗ 数据库为空,没有聊天记录", 'error')
|
||||
cprint("提示:需要先有一些聊天记录才能测试", 'system')
|
||||
conn.close()
|
||||
return None
|
||||
|
||||
cprint(f"\n✓ 数据库连接成功!共 {count} 条聊天记录", 'system')
|
||||
|
||||
# 获取客户列表
|
||||
cursor = conn.execute("""
|
||||
SELECT customer_id, customer_name, COUNT(*) as cnt, MAX(timestamp) as last
|
||||
FROM chat_logs
|
||||
GROUP BY customer_id
|
||||
ORDER BY cnt DESC
|
||||
LIMIT 20
|
||||
""")
|
||||
customers = cursor.fetchall()
|
||||
|
||||
cprint(f"\n找到 {len(customers)} 个客户:", 'cyan')
|
||||
for i, (cid, name, cnt, last) in enumerate(customers, 1):
|
||||
cprint(f" {i:2d}. {name or cid:30s} | {cnt:4d}条 | 最后:{last}", 'customer')
|
||||
|
||||
conn.close()
|
||||
return customers
|
||||
|
||||
except Exception as e:
|
||||
cprint(f"\n✗ 数据库检查失败:{e}", 'error')
|
||||
return None
|
||||
|
||||
async def test_customer_conversation(customer_id, customer_name, limit=5):
|
||||
"""测试某个客户的对话"""
|
||||
cprint(f"\n{'='*70}", 'cyan')
|
||||
cprint(f"测试客户:{customer_name or customer_id}", 'header')
|
||||
cprint(f"{'='*70}\n", 'cyan')
|
||||
|
||||
# 获取对话记录
|
||||
conn = sqlite3.connect('db/chat_log_db/chats.db')
|
||||
cursor = conn.execute("""
|
||||
SELECT direction, message, timestamp
|
||||
FROM chat_logs
|
||||
WHERE customer_id = ?
|
||||
ORDER BY timestamp ASC
|
||||
LIMIT ?
|
||||
""", (customer_id, limit))
|
||||
conversations = cursor.fetchall()
|
||||
conn.close()
|
||||
|
||||
if not conversations:
|
||||
cprint(" 该客户没有对话记录", 'system')
|
||||
return
|
||||
|
||||
# 初始化 AI Agent
|
||||
try:
|
||||
from core.pydantic_ai_agent import CustomerServiceAgent, CustomerMessage
|
||||
agent = CustomerServiceAgent(skills_dir="skills")
|
||||
cprint("✓ AI Agent 已加载", 'system')
|
||||
except Exception as e:
|
||||
cprint(f"✗ AI Agent 加载失败:{e}", 'error')
|
||||
return
|
||||
|
||||
# 模拟对话
|
||||
for i, (direction, message, timestamp) in enumerate(conversations, 1):
|
||||
if direction == 'in':
|
||||
# 客户消息
|
||||
cprint(f"\n【消息 {i}/{len(conversations)}】{timestamp}", 'system')
|
||||
cprint(f"客户:{message}", 'customer')
|
||||
|
||||
# 创建测试消息
|
||||
test_msg = CustomerMessage(
|
||||
msg_id=f"test_{i}",
|
||||
acc_id="test_shop",
|
||||
msg=message,
|
||||
from_id=customer_id,
|
||||
from_name=customer_name or "测试",
|
||||
cy_id=customer_id,
|
||||
acc_type="AliWorkbench",
|
||||
msg_type=0,
|
||||
cy_name=customer_name or "测试",
|
||||
goods_name="专业找图",
|
||||
goods_order=""
|
||||
)
|
||||
|
||||
# 获取 AI 回复
|
||||
start = datetime.now()
|
||||
try:
|
||||
response = await agent.process_message(test_msg)
|
||||
elapsed = (datetime.now() - start).total_seconds() * 1000
|
||||
|
||||
if response.should_reply:
|
||||
cprint(f"AI [{elapsed:.0f}ms]: {response.reply}", 'agent')
|
||||
|
||||
# 检测特殊内容
|
||||
if any(kw in response.reply for kw in ['元', '块', '价格']):
|
||||
cprint(" ↳ [价格信息]", 'price')
|
||||
if response.need_transfer:
|
||||
cprint(" ↳ [转人工]", 'error')
|
||||
else:
|
||||
cprint("[AI 静默]", 'system')
|
||||
|
||||
except Exception as e:
|
||||
cprint(f"✗ AI 回复失败:{e}", 'error')
|
||||
|
||||
elif direction == 'out':
|
||||
cprint(f"\n[历史回复] {timestamp}", 'system')
|
||||
cprint(f"客服:{message}", 'system')
|
||||
|
||||
cprint(f"\n{'='*70}", 'cyan')
|
||||
|
||||
async def test_all_customers(customers, limit_per_customer=5):
|
||||
"""批量测试所有客户"""
|
||||
cprint(f"\n{'='*70}", 'header')
|
||||
cprint(f" 开始批量测试 {len(customers)} 个客户", 'header')
|
||||
cprint(f" 每个客户测试前 {limit_per_customer} 条消息", 'header')
|
||||
cprint(f"{'='*70}\n", 'header')
|
||||
|
||||
total_msgs = 0
|
||||
total_replies = 0
|
||||
|
||||
for i, (cid, name, cnt, _) in enumerate(customers, 1):
|
||||
cprint(f"\n\n{'='*70}", 'cyan')
|
||||
cprint(f"进度:{i}/{len(customers)} - {name or cid} ({cnt}条消息)", 'cyan')
|
||||
cprint(f"{'='*70}", 'cyan')
|
||||
|
||||
if cnt == 0:
|
||||
cprint(" 跳过(无消息记录)", 'system')
|
||||
continue
|
||||
|
||||
# 获取对话记录
|
||||
conn = sqlite3.connect('db/chat_log_db/chats.db')
|
||||
cursor = conn.execute("""
|
||||
SELECT direction, message, timestamp
|
||||
FROM chat_logs
|
||||
WHERE customer_id = ?
|
||||
ORDER BY timestamp ASC
|
||||
LIMIT ?
|
||||
""", (cid, limit_per_customer))
|
||||
conversations = cursor.fetchall()
|
||||
conn.close()
|
||||
|
||||
# 初始化 AI Agent(只初始化一次)
|
||||
try:
|
||||
from core.pydantic_ai_agent import CustomerServiceAgent, CustomerMessage
|
||||
if i == 1: # 第一个客户时初始化
|
||||
agent = CustomerServiceAgent(skills_dir="skills")
|
||||
cprint("✓ AI Agent 已加载", 'system')
|
||||
except Exception as e:
|
||||
cprint(f"✗ AI Agent 加载失败:{e}", 'error')
|
||||
return
|
||||
|
||||
# 模拟对话
|
||||
for j, (direction, message, timestamp) in enumerate(conversations, 1):
|
||||
if direction == 'in':
|
||||
total_msgs += 1
|
||||
|
||||
# 创建测试消息
|
||||
test_msg = CustomerMessage(
|
||||
msg_id=f"test_{i}_{j}",
|
||||
acc_id="test_shop",
|
||||
msg=message,
|
||||
from_id=cid,
|
||||
from_name=name or "测试",
|
||||
cy_id=cid,
|
||||
acc_type="AliWorkbench",
|
||||
msg_type=0,
|
||||
cy_name=name or "测试",
|
||||
goods_name="专业找图",
|
||||
goods_order=""
|
||||
)
|
||||
|
||||
# 获取 AI 回复
|
||||
start = datetime.now()
|
||||
try:
|
||||
response = await agent.process_message(test_msg)
|
||||
elapsed = (datetime.now() - start).total_seconds() * 1000
|
||||
|
||||
if response.should_reply:
|
||||
total_replies += 1
|
||||
cprint(f"\n[{i}/{len(customers)}] {name or cid} - 消息 {j}", 'system')
|
||||
cprint(f"客户:{message}", 'customer')
|
||||
cprint(f"AI [{elapsed:.0f}ms]: {response.reply}", 'agent')
|
||||
|
||||
# 检测特殊内容
|
||||
if any(kw in response.reply for kw in ['元', '块', '价格']):
|
||||
cprint(" ↳ [价格信息]", 'price')
|
||||
if response.need_transfer:
|
||||
cprint(" ↳ [转人工]", 'error')
|
||||
else:
|
||||
cprint(f"\n[{i}/{len(customers)}] [AI 静默]", 'system')
|
||||
|
||||
except Exception as e:
|
||||
cprint(f"✗ AI 回复失败:{e}", 'error')
|
||||
|
||||
# 每个客户之间休息一下
|
||||
await asyncio.sleep(0.5)
|
||||
|
||||
# 统计结果
|
||||
cprint(f"\n\n{'='*70}", 'header')
|
||||
cprint(f" 批量测试完成!", 'header')
|
||||
cprint(f"{'='*70}", 'header')
|
||||
cprint(f"\n统计:", 'system')
|
||||
cprint(f" 测试客户数:{len(customers)}", 'cyan')
|
||||
cprint(f" 处理消息数:{total_msgs}", 'cyan')
|
||||
cprint(f" AI 回复数:{total_replies}", 'cyan')
|
||||
if total_msgs > 0:
|
||||
reply_rate = (total_replies / total_msgs) * 100
|
||||
cprint(f" 回复率:{reply_rate:.1f}%", 'cyan')
|
||||
|
||||
async def main():
|
||||
cprint("="*70, 'header')
|
||||
cprint(" AI Agent 对话测试", 'header')
|
||||
cprint(" 从数据库加载聊天记录,测试 AI 回复效果", 'header')
|
||||
cprint("="*70, 'header')
|
||||
|
||||
# 检查数据库
|
||||
customers = check_database()
|
||||
if not customers:
|
||||
return
|
||||
|
||||
# 选择测试模式
|
||||
cprint(f"\n请选择测试模式:", 'cyan')
|
||||
cprint(f" 1. 交互式测试 (手动选择客户)", 'customer')
|
||||
cprint(f" 2. 批量测试所有客户 (自动)", 'agent')
|
||||
cprint(f" 3. 快速测试前 5 个客户", 'price')
|
||||
cprint(f" q. 退出", 'system')
|
||||
|
||||
mode = input("\n选择:").strip().lower()
|
||||
|
||||
if mode == 'q':
|
||||
cprint("\n测试结束!", 'system')
|
||||
return
|
||||
|
||||
try:
|
||||
if mode == '1':
|
||||
# 交互式测试
|
||||
cprint(f"\n请输入客户编号 (1-{len(customers)}) 进行测试:", 'cyan')
|
||||
|
||||
while True:
|
||||
try:
|
||||
choice = input("\n选择:").strip()
|
||||
|
||||
if choice.lower() == 'q':
|
||||
cprint("\n测试结束!", 'system')
|
||||
return
|
||||
|
||||
choice_num = int(choice)
|
||||
if 1 <= choice_num <= len(customers):
|
||||
cid, name, cnt, _ = customers[choice_num - 1]
|
||||
await test_customer_conversation(cid, name or cid, limit=min(cnt, 10))
|
||||
else:
|
||||
cprint(f"请输入 1-{len(customers)} 之间的数字", 'error')
|
||||
|
||||
except ValueError:
|
||||
cprint("请输入有效数字或 q 退出", 'error')
|
||||
except KeyboardInterrupt:
|
||||
cprint("\n\n测试中断", 'error')
|
||||
return
|
||||
except Exception as e:
|
||||
cprint(f"错误:{e}", 'error')
|
||||
|
||||
elif mode == '2':
|
||||
# 批量测试所有客户
|
||||
await test_all_customers(customers, limit_per_customer=5)
|
||||
|
||||
elif mode == '3':
|
||||
# 快速测试前 5 个客户
|
||||
top_5 = customers[:5]
|
||||
cprint(f"\n快速测试前 5 个客户...", 'cyan')
|
||||
await test_all_customers(top_5, limit_per_customer=5)
|
||||
|
||||
else:
|
||||
cprint("无效的选择", 'error')
|
||||
|
||||
except KeyboardInterrupt:
|
||||
cprint("\n\n测试中断", 'error')
|
||||
except Exception as e:
|
||||
cprint(f"错误:{e}", 'error')
|
||||
|
||||
if __name__ == "__main__":
|
||||
try:
|
||||
asyncio.run(main())
|
||||
except Exception as e:
|
||||
cprint(f"\n程序异常:{e}", 'error')
|
||||
Reference in New Issue
Block a user