log-vector/ask.py at dev · barrulus/log-vector · GitHub

1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
#!/usr/bin/env python3
"""
Interactive Log File Query Tool

Query your indexed log files using natural language and get AI-generated answers.
Uses the embeddings created by index.py and generates responses using Ollama.

Usage:
    python ask.py [options]

Options:
    output_file       Markdown file to save Q&A pairs (default: ask-YYYY-Month-DD-HH-MM.md)
    --top-k N         Number of results to retrieve (default from DEFAULT_TOP_K env var)
    --model MODEL     Override the Ollama LLM model
"""

import os
import sys
import json
import argparse
from typing import List, Dict, Any, Optional, cast
from datetime import datetime
from pathlib import Path

import chromadb
from rich.console import Console
from rich.markdown import Markdown
from ollama import Client
from dotenv import load_dotenv

from config import (
    OLLAMA_HOST,
    OLLAMA_MODEL,
    CHROMA_PATH,
    EMBEDDING_MODEL,
    DEFAULT_OUTPUT_FILE_PREFIX,
    DEFAULT_TOP_K,
)
from index import LocalEmbeddingHandler, OllamaEmbeddingHandler, RemoteEmbeddingHandler

# Reload .env so trust settings are available
load_dotenv()

# Initialize console
console = Console()


def get_default_output_file() -> str:
    """Generate a timestamp-based output filename"""
    timestamp = datetime.now().strftime("%Y-%B-%d-%H-%M")
    return f"{DEFAULT_OUTPUT_FILE_PREFIX}-{timestamp}.md"


class QueryHandler:
    """Handle querying and embedding generation"""

    def __init__(self, ollama_model: str = OLLAMA_MODEL):
        self.ollama_client = Client(host=OLLAMA_HOST)
        self.ollama_model = ollama_model
        self.collection: Optional[Any] = None
        self.embedding_type: Optional[str] = None
        self.embedding_model: str = EMBEDDING_MODEL
        self._handler: Optional[Any] = None
        self._load_database()
        self._load_metadata()

    def _load_database(self) -> None:
        """Load ChromaDB collection"""
        db_path = CHROMA_PATH

        if os.path.exists(db_path):
            try:
                client = chromadb.PersistentClient(path=db_path)
                self.collection = client.get_collection("vectors")
                console.print(f"[green]✓ Using database at: {db_path}[/green]")
                console.print(f"[green]✓ Collection: vectors[/green]")
                return
            except Exception as e:
                console.print(f"[red]Error loading collection 'vectors': {e}[/red]")

        raise Exception(
            f"No indexed database found at {db_path}. Please run: python index.py /path/to/repository"
        )

    def _load_metadata(self) -> None:
        """Load indexing metadata to determine embedding type"""
        metadata_path = Path(CHROMA_PATH) / "index_metadata.json"

        if metadata_path.exists():
            try:
                with open(metadata_path, 'r') as f:
                    metadata = json.load(f)
                    self.embedding_type = metadata.get('embedding_type')
                    self.embedding_model = metadata.get('embedding_model', EMBEDDING_MODEL)

                    if not self.embedding_type:
                        raise ValueError("Missing embedding_type in metadata")

                    console.print(f"[cyan]Embedding type: {self.embedding_type}[/cyan]")
                    console.print(f"[cyan]Embedding model: {self.embedding_model}[/cyan]")
            except Exception as e:
                console.print(f"[red]Error loading metadata: {e}[/red]")
                console.print("[red]Please re-index your repository with: python index.py /path/to/repository[/red]")
                raise Exception("Invalid or missing metadata. Re-indexing required.")
        else:
            console.print(f"[red]No metadata file found at {metadata_path}[/red]")
            console.print("[red]Please index your repository first with: python index.py /path/to/repository[/red]")
            raise Exception("No index metadata found. Please run indexing first.")

    def _get_handler(self) -> Any:
        """Lazily initialise the right embedding handler based on index metadata."""
        if self._handler is None:
            if self.embedding_type == "ollama":
                self._handler = OllamaEmbeddingHandler(self.embedding_model)
            elif self.embedding_type == "local":
                self._handler = LocalEmbeddingHandler(self.embedding_model)
            else:
                self._handler = RemoteEmbeddingHandler(self.embedding_model)
        return self._handler

    def get_embedding(self, text: str) -> List[float]:
        """Get embedding using the appropriate handler from index.py"""
        handler = self._get_handler()
        result = handler.embed([text])
        return result[0]

    def query_codebase(self, question: str, top_k: int = DEFAULT_TOP_K) -> str:
        """Query the logs and generate a response"""
        # Get embedding for the question
        try:
            q_embed = self.get_embedding(question)
        except Exception as e:
            return f"Error generating embedding: {e}"

        # Query ChromaDB
        if not self.collection:
            return "Database collection not loaded."

        results = self.collection.query(
            query_embeddings=[q_embed],
            n_results=top_k
        )

        # Build context from results
        context = ""
        if results.get('documents') and results.get('metadatas'):
            documents = cast(List[Any], results['documents'][0] if results['documents'] else [])
            metadatas = cast(List[Dict[str, Any]], results['metadatas'][0] if results['metadatas'] else [])
            for doc, meta in zip(documents, metadatas):
                source = str(meta.get('source', meta.get('file', 'Unknown')) if meta else 'Unknown')
                chunk_idx = str(meta.get('chunk_index', '') if meta else '')

                context += f"File: {source}"
                if chunk_idx:
                    context += f" (chunk {chunk_idx})"
                context += f"\n{str(doc)}\n\n"

        if not context:
            return "No relevant data found for your question."

        # Generate response using Ollama
        prompt = f"""You are a helpful systems administrator. Here's some relevant server log context:

{context}

Now answer this question: {question}

Format your entire response using markdown with appropriate headers, code blocks, bullet points, etc."""

        try:
            response = cast(Any, self.ollama_client.chat(  # type: ignore[misc]
                model=self.ollama_model,
                messages=[
                    {
                        "role": "system",
                        "content": "You are a systems administrator that provides clear, accurate answers based on the provided server log context. Always format your responses in well-structured markdown."
                    },
                    {
                        "role": "user",
                        "content": prompt
                    }
                ],
                think=False
            ))
            # Handle the response - expect dict with 'message' key
            if hasattr(response, 'get') and response.get('message'):
                message = response.get('message', {})
                if hasattr(message, 'get'):
                    content = message.get('content', '')
                    return str(content) if content else "No content in response"
                return str(message)
            return "Error: Invalid response format"
        except Exception as e:
            return f"Error generating response: {e}"


def write_to_markdown(question: str, answer: str, filename: str) -> None:
    """Append question and answer to a markdown file with timestamp"""
    timestamp = datetime.now().strftime("%Y-%m-%d %H:%M:%S")

    # Create the file if it doesn't exist
    if not os.path.exists(filename):
        with open(filename, "w", encoding="utf-8") as f:
            f.write("# Log File Query Log\n\n")
            f.write("This file contains questions and answers about the Log Files.\n\n")

    # Append the Q&A pair
    with open(filename, "a", encoding="utf-8") as f:
        f.write(f"## Question [{timestamp}]\n\n")
        f.write(f"**Q:** {question}\n\n")
        f.write(f"**A:**\n\n{answer}\n\n")
        f.write("---\n\n")


def main() -> None:
    """Main interactive loop"""
    parser = argparse.ArgumentParser(
        description="Interactive log file query tool",
        formatter_class=argparse.RawDescriptionHelpFormatter,
        epilog=__doc__,
    )
    parser.add_argument(
        'output_file',
        nargs='?',
        default=get_default_output_file(),
        help='Markdown file to save Q&A pairs (default: ask-YYYY-Month-DD-HH-MM.md)',
    )
    parser.add_argument(
        '--top-k',
        type=int,
        default=DEFAULT_TOP_K,
        help=f'Number of results to retrieve (default: {DEFAULT_TOP_K})',
    )
    parser.add_argument(
        '--model',
        type=str,
        default=OLLAMA_MODEL,
        help=f'Ollama LLM model for response generation (default: {OLLAMA_MODEL})',
    )

    args = parser.parse_args()
    output_file: str = args.output_file

    console.print(f"\n[bold cyan]Log Query Tool[/bold cyan]")
    console.print(f"Output file: [cyan]{output_file}[/cyan]")
    console.print(f"Ollama model: [cyan]{args.model}[/cyan]")
    console.print("\nType 'exit' or 'quit' to stop.\n")

    # Initialize query handler
    try:
        handler = QueryHandler(ollama_model=args.model)
    except Exception as e:
        console.print(f"[red]Error: {e}[/red]")
        sys.exit(1)

    # Interactive loop
    while True:
        try:
            question = input("\n[?] Ask a question about the log files: ")

            if question.lower() in ['exit', 'quit', 'q']:
                console.print(f"\n[green]✓ All responses saved to {output_file}[/green]")
                break

            if not question.strip():
                continue

            # Generate answer
            console.print("\n[yellow]Searching log files and generating response...[/yellow]")
            answer = handler.query_codebase(question, top_k=args.top_k)

            # Write to file
            write_to_markdown(question, answer, output_file)

            # Display answer
            console.print("\n[bold]Answer:[/bold]\n")
            console.print(Markdown(answer))

            console.print(f"\n[dim]Response saved to {output_file}[/dim]")

        except KeyboardInterrupt:
            console.print("\n\n[yellow]Interrupted. Exiting...[/yellow]")
            break
        except Exception as e:
            console.print(f"\n[red]Error: {e}[/red]")


if __name__ == "__main__":
    main()