documentation-agent/documentation_agent.py at main · Croups/documentation-agent · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
# Enable nested async loops for Jupyter notebooks
import nest_asyncio
nest_asyncio.apply()

# Import required LlamaIndex components for document processing and indexing
from llama_index.core import (
    SimpleDirectoryReader,
    VectorStoreIndex,
)
from llama_index.core.extractors import TitleExtractor
from llama_index.core.ingestion import IngestionPipeline
from llama_index.core.node_parser import SentenceSplitter
from llama_index.core.storage import StorageContext
from llama_index.core.vector_stores import SimpleVectorStore
from llama_index.embeddings.openai import OpenAIEmbedding

# Load documents from the specified directory
documents = SimpleDirectoryReader("docs/learn").load_data()
vector_store = SimpleVectorStore()
storage_context = StorageContext.from_defaults(vector_store=vector_store)

# Set up document processing pipeline with sentence splitting and embedding
pipeline = IngestionPipeline(
    transformations=[
        SentenceSplitter(chunk_size=512, chunk_overlap=128),
        TitleExtractor(),
        OpenAIEmbedding(),
    ],
    vector_store=vector_store,
)

# Process documents through the pipeline and create vector index
nodes = pipeline.run(documents=documents)
index = VectorStoreIndex(
    nodes,
    storage_context=storage_context,
)

# Save the index to disk
index.storage_context.persist()

# Import components for loading saved index
from llama_index.core import (
    load_index_from_storage,
)

# Load the saved index and create query engine
storage_context = StorageContext.from_defaults(persist_dir="storage")
loaded_index = load_index_from_storage(storage_context)
query_engine = loaded_index.as_query_engine()

# Import Mirascope and Pydantic components for response handling
from mirascope.core import openai, prompt_template
from pydantic import BaseModel, Field

# Define data model for document relevance scoring
class Relevance(BaseModel):
    id: int = Field(..., description="The document ID")
    score: int = Field(..., description="The relevance score (1-10)")
    document: str = Field(..., description="The document text")
    reason: str = Field(..., description="A brief explanation for the assigned score")

# GPT-4 function for reranking documents based on relevance
@openai.call(
    "gpt-4o-mini",
    response_model=list[Relevance],
    json_mode=True,
)
@prompt_template(
    """
You are an advanced document relevance assessment system. Your task is to evaluate a list of documents and determine their relevance to a given question. Follow these instructions carefully:

1. Review the question:
<question>
{query}
</question>

2. Examine the list of documents:
<documents>
{documents}
</documents>

3. For each document, perform the following analysis inside document_evaluation tags:
   a. Quote relevant passages from the document.
   b. Consider arguments for and against the document's relevance.
   c. List specific ways the document contributes to answering the question.
   d. Count the number of relevant points made in the document.
   e. Determine if the document is relevant (score 5 or above).
   f. If relevant, analyze its content in relation to the question.
   g. Consider both direct and indirect relevance.
   h. Assess the informativeness of the content, not just keyword matches.
   i. Think about how this document might contribute to a complete answer.
   j. Assign a relevance score from 5 to 10.
   k. Provide a reason for the assigned score.

It's OK for this section to be quite long.

4. After analyzing all documents, consider how they might work together to answer the question.

5. Present your final assessment in the following format:

<assessment>
  <document>
    <id>[Document ID]</id>
    <score>[Relevance score (5-10)]</score>
    <reason>[Explanation for the score]</reason>
  </document>
  [Repeat for each relevant document]
  <overall_analysis>
    [Brief explanation of how the documents collectively address the question]
  </overall_analysis>
</assessment>

Important guidelines:
- Exclude documents with relevance scores below 5.
- Prioritize positive, affirmative information over negative statements.
- Be thorough in your analysis, considering all aspects of each document's relevance.
- Ensure your reasoning is clear and justified.

Begin your assessment now.
    """
)
def llm_query_rerank(documents: list[dict], query: str): ...

# Import typing components
from typing import cast

from llama_index.core import QueryBundle
from llama_index.core.indices.vector_store import VectorIndexRetriever

# Function to retrieve relevant documents based on query
def get_documents(query: str) -> list[str]:
    """The get_documents tool that retrieves Mirascope documentation based on the
    relevance of the query"""
    query_bundle = QueryBundle(query)
    retriever = VectorIndexRetriever(
        index=cast(VectorStoreIndex, loaded_index),
        similarity_top_k=10,
    )
    retrieved_nodes = retriever.retrieve(query_bundle)
    choice_batch_size = 5
    top_n = 2
    results: list[Relevance] = []

    # Process retrieved nodes in batches
    for idx in range(0, len(retrieved_nodes), choice_batch_size):
        nodes_batch = [
            {
                "id": idx + id,
                "text": node.node.get_text(),
                "document_title": node.metadata["document_title"],
                "semantic_score": node.score,
            }
            for id, node in enumerate(retrieved_nodes[idx : idx + choice_batch_size])
        ]
        results += llm_query_rerank(nodes_batch, query)

    # Sort and return top results
    results = sorted(results, key=lambda x: x.score or 0, reverse=True)[:top_n]
    return [result.document for result in results]

# Import components for response handling
from typing import Literal
from pydantic import BaseModel, Field
from mirascope.core import openai, prompt_template

# Define response data model
class Response(BaseModel):
    classification: Literal["code", "general"] = Field(
        ..., description="The classification of the question"
    )
    content: str = Field(..., description="The response content")

# Main documentation agent class
class DocumentationAgent(BaseModel):

    # GPT-4 function to process and answer questions
    @openai.call("gpt-4o-mini", response_model=Response, json_mode=True)
    @prompt_template(
        """
        SYSTEM:
        You are an AI Assistant that is an expert at answering questions about Mirascope.
        Here is the relevant documentation to answer the question.

        First classify the question into one of two types:
            - General Information: Questions about the system or its components.
            - Code Examples: Questions that require code snippets or examples.

        For General Information, provide a summary of the relevant documents if the question is too broad ask for more details.
        If the context does not answer the question, say that the information is not available or you could not find it.

        For Code Examples, output ONLY code without any markdown, with comments if necessary.
        If the context does not answer the question, say that the information is not available.

        Examples:
            Question: "What is Mirascope?"
            Answer:
            classification: general
            content: A toolkit for building AI-powered applications with Large Language Models (LLMs).

            Question: "How do I make a basic OpenAI call?"
            Answer:
            classification: code
            content: |
                from mirascope.core import openai

                @openai.call("gpt-4o-mini")
                def basic_call() -> str:
                    return "Hello, world!"

                response = basic_call()
                print(response.content)

        Context:
        {context:list}

        USER:
        {question}
        """
    )
    def _call(self, question: str) -> openai.OpenAIDynamicConfig:
        # Get relevant documents and prepare response
        documents = get_documents(question)
        return {"computed_fields": {"context": documents}}

    def _step(self, question: str):
        # Process single question and print response
        answer = self._call(question)
        print("(Assistant):", answer.content)

    def run(self):
        # Main interaction loop
        while True:
            question = input("(User): ")
            if question == "exit":
                break
            self._step(question)

# Main execution block
if __name__ == "__main__":
    agent = DocumentationAgent()
    agent.run()