Skip to content

Commit bc51db9

Browse files
committed
feat: add tool metrics
1 parent 8dee6e5 commit bc51db9

File tree

5 files changed

+4831
-16
lines changed

5 files changed

+4831
-16
lines changed

agent.py

Lines changed: 51 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,51 @@
1+
from veadk import Agent, Runner
2+
from veadk.config import getenv
3+
from veadk.knowledgebase import KnowledgeBase
4+
from veadk.memory.long_term_memory import LongTermMemory
5+
from veadk.memory.short_term_memory import ShortTermMemory
6+
from veadk.tools.builtin_tools.web_search import web_search
7+
from veadk.tools.demo_tools import get_city_weather
8+
from veadk.tracing.telemetry.exporters.apmplus_exporter import APMPlusExporter
9+
from veadk.tracing.telemetry.exporters.cozeloop_exporter import CozeloopExporter
10+
from veadk.tracing.telemetry.exporters.tls_exporter import TLSExporter
11+
from veadk.tracing.telemetry.opentelemetry_tracer import OpentelemetryTracer
12+
13+
tracer = OpentelemetryTracer(
14+
exporters=[
15+
# CozeloopExporter(),
16+
APMPlusExporter(),
17+
TLSExporter(),
18+
]
19+
)
20+
21+
agent = Agent(
22+
name="test",
23+
tracers=[tracer],
24+
tools=[get_city_weather],
25+
# long_term_memory=LongTermMemory(backend="local"),
26+
# knowledgebase=KnowledgeBase(backend="local", app_name="veadk_default_app"),
27+
)
28+
29+
short_term_memory = ShortTermMemory()
30+
31+
runner = Runner(agent=agent, short_term_memory=short_term_memory)
32+
33+
import asyncio
34+
35+
for i in range(0, 300):
36+
res = asyncio.run(
37+
runner.run(
38+
messages="搜索我的记忆、知识库,看看能不能获取到北京天气",
39+
session_id="test_session",
40+
save_tracing_data=False,
41+
)
42+
)
43+
44+
print(res)
45+
46+
import time
47+
48+
time.sleep(5)
49+
50+
51+
# print(getenv("MODEL_AGENT_EXTRA_CONFIG"))

deep_eval_test.py

Lines changed: 21 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,21 @@
1+
2+
import pytest
3+
from deepeval import assert_test
4+
from deepeval.metrics import GEval
5+
from deepeval.test_case import LLMTestCase, LLMTestCaseParams
6+
7+
def test_case():
8+
correctness_metric = GEval(
9+
name="Correctness",
10+
criteria="Determine if the 'actual output' is correct based on the 'expected output'.",
11+
evaluation_params=[LLMTestCaseParams.ACTUAL_OUTPUT, LLMTestCaseParams.EXPECTED_OUTPUT],
12+
threshold=0.5
13+
)
14+
test_case = LLMTestCase(
15+
input="What if these shoes don't fit?",
16+
# Replace this with the actual output from your LLM application
17+
actual_output="You have 30 days to get a full refund at no extra cost.",
18+
expected_output="We offer a 30-day full refund at no extra costs.",
19+
retrieval_context=["All customers are eligible for a 30 day full refund at no extra costs."]
20+
)
21+
assert_test(test_case, [correctness_metric])

0 commit comments

Comments
 (0)