From dbecd34fa855b30008af489abb2004e59c3e7957 Mon Sep 17 00:00:00 2001
From: Samuel Colvin
Date: Thu, 24 Oct 2024 14:38:33 +0100
Subject: [PATCH] adding rag example

---
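A quick way to sanity-check the search database after running the build step described below. This is a minimal sketch, not part of the diff: it mirrors the search() helper added in examples/rag.py and assumes the DSN and doc_sections table created by that example, plus an OPENAI_API_KEY in the environment.

    import asyncio

    import asyncpg
    import pydantic_core
    from openai import AsyncOpenAI

    # connection string used by examples/rag.py (assumes the 'build' step has been run)
    DSN = 'postgresql://postgres:postgres@localhost:54320/pydantic_ai_rag'


    async def main() -> None:
        openai = AsyncOpenAI()
        conn = await asyncpg.connect(DSN)
        try:
            # embed the question with the same model used when the sections were inserted
            embedding = await openai.embeddings.create(
                input='How do I configure logfire to work with FastAPI?',
                model='text-embedding-3-small',
            )
            embedding_json = pydantic_core.to_json(embedding.data[0].embedding).decode()
            # pgvector's <-> operator orders rows by distance to the query embedding
            rows = await conn.fetch(
                'SELECT url, title FROM doc_sections ORDER BY embedding <-> $1 LIMIT 5',
                embedding_json,
            )
            for row in rows:
                print(row['url'])
        finally:
            await conn.close()


    asyncio.run(main())

The retrieve() tool registered with @agent.retriever_context in examples/rag.py wraps the same query, so the model can call it while answering a question.
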
 .gitignore          |   1 +
 examples/rag.py     | 252 ++++++++++++++++++++++++++++++++++++++++++++
 examples/sql_gen.py |   1 +
 pyproject.toml      |   2 +-
 uv.lock             |  23 +++-
 5 files changed, 276 insertions(+), 3 deletions(-)
 create mode 100644 examples/rag.py

diff --git a/.gitignore b/.gitignore
index f7cc9b3d4..3714644e0 100644
--- a/.gitignore
+++ b/.gitignore
@@ -8,3 +8,4 @@ __pycache__
 /.coverage
 env*/
 /TODO.md
+/postgres-data/
diff --git a/examples/rag.py b/examples/rag.py
new file mode 100644
index 000000000..3300d5c7b
--- /dev/null
+++ b/examples/rag.py
@@ -0,0 +1,252 @@
+"""RAG example with pydantic-ai.
+
+Run pgvector with:
+
+    mkdir postgres-data
+    docker run --rm -e POSTGRES_PASSWORD=postgres -p 54320:5432 -v `pwd`/postgres-data:/var/lib/postgresql/data pgvector/pgvector:pg17
+
+Build the search DB with:
+
+    uv run --extra examples -m examples.rag build
+
+Ask the agent a question with:
+
+    uv run --extra examples -m examples.rag search "How do I configure logfire to work with FastAPI?"
+"""
+
+from __future__ import annotations as _annotations
+
+import asyncio
+import os
+import re
+import sys
+import unicodedata
+from contextlib import asynccontextmanager
+from dataclasses import dataclass
+from typing import cast
+
+import asyncpg
+import httpx
+import logfire
+import pydantic_core
+from openai import AsyncOpenAI
+from pydantic import TypeAdapter
+from typing_extensions import AsyncGenerator
+
+from pydantic_ai import CallContext
+from pydantic_ai.agent import Agent, KnownModelName
+
+# 'if-token-present' means nothing will be sent (and the example will work) if you don't have logfire set up
+logfire.configure(send_to_logfire='if-token-present')
+logfire.instrument_asyncpg()
+
+
+@dataclass
+class Deps:
+    openai: AsyncOpenAI
+    pool: asyncpg.Pool
+
+
+model = cast(KnownModelName, os.getenv('PYDANTIC_AI_MODEL', 'openai:gpt-4o'))
+agent: Agent[Deps, str] = Agent(model)
+
+
+@agent.retriever_context
+async def retrieve(context: CallContext[Deps], search_query: str) -> str:
+    with logfire.span('create embedding for {search_query=}', search_query=search_query):
+        embedding = await context.deps.openai.embeddings.create(
+            input=search_query,
+            model='text-embedding-3-small',
+        )
+
+    assert len(embedding.data) == 1, f'Expected 1 embedding, got {len(embedding.data)}, doc query: {search_query!r}'
+    embedding = embedding.data[0].embedding
+    embedding_json = pydantic_core.to_json(embedding).decode()
+    rows = await context.deps.pool.fetch(
+        'SELECT url, title, content FROM doc_sections ORDER BY embedding <-> $1 LIMIT 8',
+        embedding_json,
+    )
+    return '\n\n'.join(f'# {row["title"]}\nDocumentation URL:{row["url"]}\n\n{row["content"]}\n' for row in rows)
+
+
+async def run_agent(question: str):
+    openai = AsyncOpenAI()
+    logfire.instrument_openai(openai)
+
+    logfire.info('Asking "{question}"', question=question)
+
+    async with database_connect() as pool:
+        deps = Deps(openai=openai, pool=pool)
+        answer = await agent.run(question, deps=deps)
+        print(answer.response)
+
+
+async def search(openai: AsyncOpenAI, pool: asyncpg.Pool, query: str) -> list[str]:
+    with logfire.span('create embedding for {query=}', query=query):
+        embedding = await openai.embeddings.create(
+            input=query,
+            model='text-embedding-3-small',
+        )
+
+    assert len(embedding.data) == 1, f'Expected 1 embedding, got {len(embedding.data)}, doc query: {query!r}'
+    embedding = embedding.data[0].embedding
+    embedding_json = pydantic_core.to_json(embedding).decode()
+    matches = await pool.fetch(
+        'SELECT url FROM doc_sections ORDER BY embedding <-> $1 LIMIT 5',
+        embedding_json,
+    )
+    return [match[0] for match in matches]
+
+
+# JSON document from https://gist.github.com/samuelcolvin/4b5bb9bb163b1122ff17e29e48c10992
+DOCS_JSON = 'https://gist.githubusercontent.com/samuelcolvin/4b5bb9bb163b1122ff17e29e48c10992/raw/80c5925c42f1442c24963aaf5eb1a324d47afe95/logfire_docs.json'
+
+
+async def build_search_db():
+    async with httpx.AsyncClient() as client:
+        response = await client.get(DOCS_JSON)
+        response.raise_for_status()
+        sections = sessions_ta.validate_json(response.content)
+    openai = AsyncOpenAI()
+    logfire.instrument_openai(openai)
+
+    async with database_connect(True) as pool:
+        with logfire.span('create schema'):
+            async with pool.acquire() as conn:
+                async with conn.transaction():
+                    await conn.execute(DB_SCHEMA)
+        await insert_doc_sections(openai, pool, sections)
+
+
+async def insert_doc_sections(openai: AsyncOpenAI, pool: asyncpg.Pool, sections: list[DocsSection]):
+    queue = asyncio.Queue()
+
+    for section in sections:
+        queue.put_nowait(section)
+
+    async def worker():
+        while True:
+            s = cast(DocsSection, await queue.get())
+            try:
+                await insert_doc_section(openai, pool, s)
+            except Exception:
+                logfire.exception('Error inserting {url=}', url=s.url())
+                raise
+            finally:
+                queue.task_done()
+
+    with logfire.span('inserting doc sections'):
+        tasks = [asyncio.create_task(worker()) for _ in range(30)]
+        await queue.join()
+        for task in tasks:
+            task.cancel()
+        await asyncio.gather(*tasks, return_exceptions=True)
+
+
+@logfire.instrument()
+async def insert_doc_section(openai: AsyncOpenAI, pool: asyncpg.Pool, section: DocsSection) -> bool:
+    url = section.url()
+    exists = await pool.fetchval('SELECT 1 FROM doc_sections WHERE url = $1', url)
+    if exists:
+        logfire.info('Skipping {url=}', url=url)
+        return False
+
+    with logfire.span('create embedding for {url=}', url=url):
+        embedding = await openai.embeddings.create(
+            input=section.embedding_content(),
+            model='text-embedding-3-small',
+        )
+    assert len(embedding.data) == 1, f'Expected 1 embedding, got {len(embedding.data)}, doc section: {section}'
+    embedding = embedding.data[0].embedding
+    embedding_json = pydantic_core.to_json(embedding).decode()
+    await pool.execute(
+        'INSERT INTO doc_sections (url, title, content, embedding) VALUES ($1, $2, $3, $4)',
+        url,
+        section.title,
+        section.content,
+        embedding_json,
+    )
+    return True
+
+
+@dataclass
+class DocsSection:
+    id: int
+    parent: int | None
+    path: str
+    level: int
+    title: str
+    content: str
+
+    def url(self) -> str:
+        url_path = re.sub(r'\.md$', '', self.path)
+        return f'https://logfire.pydantic.dev/docs/{url_path}/#{slugify(self.title, "-")}'
+
+    def embedding_content(self) -> str:
+        return '\n\n'.join((f'path: {self.path}', f'title: {self.title}', self.content))
+
+
+sessions_ta = TypeAdapter(list[DocsSection])
+
+
+# pyright: reportUnknownMemberType=false
+# pyright: reportUnknownVariableType=false
+@asynccontextmanager
+async def database_connect(create_db: bool = False) -> AsyncGenerator[asyncpg.Pool, None]:
+    server_dsn, database = 'postgresql://postgres:postgres@localhost:54320', 'pydantic_ai_rag'
+    if create_db:
+        with logfire.span('check and create DB'):
+            conn = await asyncpg.connect(server_dsn)
+            try:
+                db_exists = await conn.fetchval('SELECT 1 FROM pg_database WHERE datname = $1', database)
+                if not db_exists:
+                    await conn.execute(f'CREATE DATABASE {database}')
+            finally:
+                await conn.close()
+
+    pool = await asyncpg.create_pool(f'{server_dsn}/{database}')
+    try:
+        yield pool
+    finally:
+        await pool.close()
+
+
+DB_SCHEMA = """
+CREATE EXTENSION IF NOT EXISTS vector;
+
+CREATE TABLE IF NOT EXISTS doc_sections (
+    id serial PRIMARY KEY,
+    url text NOT NULL UNIQUE,
+    title text NOT NULL,
+    content text NOT NULL,
+    -- text-embedding-3-small returns a vector of 1536 floats
+    embedding vector(1536) NOT NULL
+);
+CREATE INDEX IF NOT EXISTS idx_doc_sections_embedding ON doc_sections USING hnsw (embedding vector_l2_ops);
+"""
+
+
+def slugify(value: str, separator: str, unicode: bool = False) -> str:
+    """Slugify a string, to make it URL friendly."""
+    # Taken unchanged from https://github.com/Python-Markdown/markdown/blob/3.7/markdown/extensions/toc.py#L38
+    if not unicode:
+        # Replace Extended Latin characters with ASCII, i.e. `žlutý` => `zluty`
+        value = unicodedata.normalize('NFKD', value)
+        value = value.encode('ascii', 'ignore').decode('ascii')
+    value = re.sub(r'[^\w\s-]', '', value).strip().lower()
+    return re.sub(rf'[{separator}\s]+', separator, value)
+
+
+if __name__ == '__main__':
+    action = sys.argv[1] if len(sys.argv) > 1 else None
+    if action == 'build':
+        asyncio.run(build_search_db())
+    elif action == 'search':
+        if len(sys.argv) == 3:
+            q = sys.argv[2]
+        else:
+            q = 'How do I configure logfire to work with FastAPI?'
+        asyncio.run(run_agent(q))
+    else:
+        print('uv run --extra examples -m examples.rag build|search', file=sys.stderr)
+        sys.exit(1)
diff --git a/examples/sql_gen.py b/examples/sql_gen.py
index ec68588a5..2a6d32a3f 100644
--- a/examples/sql_gen.py
+++ b/examples/sql_gen.py
@@ -24,6 +24,7 @@
 
 # 'if-token-present' means nothing will be sent (and the example wil work) if you don't have logfire set up
 logfire.configure()
+logfire.instrument_asyncpg()
 
 DB_SCHEMA = """
 CREATE TABLE IF NOT EXISTS records (
diff --git a/pyproject.toml b/pyproject.toml
index 2324f49a1..58e596eb4 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -48,7 +48,7 @@ logfire = [
 ]
 examples = [
     "asyncpg>=0.30.0",
-    "logfire>=1.2.0",
+    "logfire[asyncpg]>=1.2.0",
 ]
 
 [tool.uv]
diff --git a/uv.lock b/uv.lock
index 534720299..146c68534 100644
--- a/uv.lock
+++ b/uv.lock
@@ -592,6 +592,11 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/7d/7f/37d9c3cbed1ef23b467c0c0039f35524595f8fd79f3acb54e647a0ccd590/logfire-1.2.0-py3-none-any.whl", hash = "sha256:edb2b441e418cf31877bd97e24b3755f873bb423f834cca66f315b25bde61ebd", size = 164724 },
 ]
 
+[package.optional-dependencies]
+asyncpg = [
+    { name = "opentelemetry-instrumentation-asyncpg" },
+]
+
 [[package]]
 name = "logfire-api"
 version = "1.2.0"
@@ -750,6 +755,20 @@ wheels = [
     { url = "https://files.pythonhosted.org/packages/0a/7f/405c41d4f359121376c9d5117dcf68149b8122d3f6c718996d037bd4d800/opentelemetry_instrumentation-0.48b0-py3-none-any.whl", hash = "sha256:a69750dc4ba6a5c3eb67986a337185a25b739966d80479befe37b546fc870b44", size = 29449 },
 ]
 
+[[package]]
+name = "opentelemetry-instrumentation-asyncpg"
+version = "0.48b0"
+source = { registry = "https://pypi.org/simple" }
+dependencies = [
+    { name = "opentelemetry-api" },
+    { name = "opentelemetry-instrumentation" },
+    { name = "opentelemetry-semantic-conventions" },
+]
+sdist = { url = "https://files.pythonhosted.org/packages/17/6c/fecc5a597cb2059d3388c497b77ef8caa30c2ce6d2caa8f4517b1a9fae9f/opentelemetry_instrumentation_asyncpg-0.48b0.tar.gz", hash = "sha256:c7cf78f50f489779c3ea526d4fe618589b2606c42ea6ad87d15818f7f70f53d3", size = 8577 }
+wheels = [
+    { url = "https://files.pythonhosted.org/packages/1e/4f/2c8aa63e65947521344c8bef4028dd4e2261fabcd2cd74d737271f36d4d8/opentelemetry_instrumentation_asyncpg-0.48b0-py3-none-any.whl", hash = "sha256:c9a70241120ada6bf4eafd865254165a24ef9a2d1e44aaeecb836817794781f2", size = 9975 },
+]
+
 [[package]]
 name = "opentelemetry-proto"
 version = "1.27.0"
@@ -871,7 +890,7 @@ dependencies = [
 [package.optional-dependencies]
 examples = [
     { name = "asyncpg" },
-    { name = "logfire" },
+    { name = "logfire", extra = ["asyncpg"] },
 ]
 logfire = [
     { name = "logfire" },
@@ -897,8 +916,8 @@ requires-dist = [
     { name = "eval-type-backport", specifier = ">=0.2.0" },
     { name = "griffe", specifier = ">=1.3.2" },
     { name = "httpx", specifier = ">=0.27.2" },
-    { name = "logfire", marker = "extra == 'examples'", specifier = ">=1.2.0" },
     { name = "logfire", marker = "extra == 'logfire'", specifier = ">=1.2.0" },
+    { name = "logfire", extras = ["asyncpg"], marker = "extra == 'examples'", specifier = ">=1.2.0" },
     { name = "logfire-api", specifier = ">=1.2.0" },
     { name = "openai", specifier = ">=1.51.2" },
     { name = "pydantic", specifier = ">=2.9.2" },