
Commit 8839f3b

feat(indexing): enhance search, chunking and file watching
Major improvements to indexing and search functionality:
- Add scoring explanations and custom weights
- Improve document chunking with better overlap handling
- Enhance file watching reliability
- Add debug features and logging
- Improve test coverage and error handling

Co-authored-by: Bob <[email protected]>
1 parent 5868e61 commit 8839f3b

14 files changed: +738 -266 lines changed

.gitignore (+1)

@@ -44,3 +44,4 @@ benchmark_index/
 
 # Test coverage
 .coverage
+benchmark_data

Makefile (+3)

@@ -4,3 +4,6 @@ test:
 # run linting, typechecking, and tests
 check:
 	pre-commit run --all-files
+
+typecheck:
+	pre-commit run mypy --all-files

examples/basic/search.py (+1 -1)

@@ -26,7 +26,7 @@ def main():
     indexer.index_directory(docs_dir, glob_pattern="**/*.md")
 
     # Search
-    documents, distances = indexer.search(query, n_results=3)
+    documents, distances, _ = indexer.search(query, n_results=3)
 
     # Display results
     console.print(f"\nResults for: [cyan]{query}[/cyan]\n")
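The same one-line change appears in all three examples: Indexer.search now returns a third value alongside the documents and distances. A minimal sketch of the updated call pattern, reusing the indexer and query from the example above and assuming the third element carries scoring explanations (populated only when explain=True, as the cli.py changes below suggest) and is otherwise ignored:

# Sketch only: assumes search() now returns (documents, distances, explanations).
documents, distances, _ = indexer.search(query, n_results=3)

# When explanations are wanted (mirrors the cli.py usage further below):
documents, distances, explanations = indexer.search(query, n_results=3, explain=True)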

examples/code-search/search_docs.py (+1 -1)

@@ -80,7 +80,7 @@ def main():
             continue
 
         # Search with chunk grouping
-        documents, distances = indexer.search(
+        documents, distances, _ = indexer.search(
             query,
             n_results=5,
             group_chunks=True,

examples/knowledge-base/search_kb.py (+1 -1)

@@ -84,7 +84,7 @@ def main(query: str | None, index_dir: Path, interactive: bool, show_content: bo
     def do_search(search_query: str):
         """Perform search and display results."""
         # Search with chunk grouping
-        documents, distances = indexer.search(
+        documents, distances, _ = indexer.search(
             search_query,
             n_results=5,
             group_chunks=True,

gptme_rag/benchmark.py (+1 -1)

@@ -169,7 +169,7 @@ def search_operation():
         )
         total_results = 0
         for query in queries:
-            results, _ = indexer.search(query, n_results=n_results)
+            results, _, _ = indexer.search(query, n_results=n_results)
            total_results += len(results)
         return {
             "items_processed": len(queries),

gptme_rag/cli.py (+93 -21)

@@ -35,9 +35,7 @@ def cli(verbose: bool):
 
 
 @cli.command()
-@click.argument(
-    "directory", type=click.Path(exists=True, file_okay=False, path_type=Path)
-)
+@click.argument("paths", nargs=-1, type=click.Path(exists=True, path_type=Path))
 @click.option(
     "--pattern", "-p", default="**/*.*", help="Glob pattern for files to index"
 )
@@ -47,16 +45,29 @@ def cli(verbose: bool):
     default=default_persist_dir,
     help="Directory to persist the index",
 )
-def index(directory: Path, pattern: str, persist_dir: Path):
-    """Index documents in a directory."""
+def index(paths: list[Path], pattern: str, persist_dir: Path):
+    """Index documents in one or more directories."""
+    if not paths:
+        console.print("❌ No paths provided", style="red")
+        return
+
     try:
         indexer = Indexer(persist_directory=persist_dir, enable_persist=True)
-        console.print(f"Indexing files in {directory} with pattern {pattern}")
-
-        # Index the files
-        n_indexed = indexer.index_directory(directory, pattern)
-
-        console.print(f"✅ Successfully indexed {n_indexed} files", style="green")
+        total_indexed = 0
+
+        for path in paths:
+            if path.is_file():
+                console.print(f"Indexing file: {path}")
+                n_indexed = indexer.index_file(path)
+                if n_indexed is not None:
+                    total_indexed += n_indexed
+            else:
+                console.print(f"Indexing files in {path} with pattern {pattern}")
+                n_indexed = indexer.index_directory(path, pattern)
+                if n_indexed is not None:
+                    total_indexed += n_indexed
+
+        console.print(f"✅ Successfully indexed {total_indexed} files", style="green")
     except Exception as e:
         console.print(f"❌ Error indexing directory: {e}", style="red")
 
@@ -74,6 +85,12 @@ def index(directory: Path, pattern: str, persist_dir: Path):
 @click.option("--max-tokens", default=4000, help="Maximum tokens in context window")
 @click.option("--show-context", is_flag=True, help="Show the full context content")
 @click.option("--raw", is_flag=True, help="Skip syntax highlighting")
+@click.option("--explain", is_flag=True, help="Show scoring explanations")
+@click.option(
+    "--weights",
+    type=click.STRING,
+    help="Custom scoring weights as JSON string, e.g. '{\"recency_boost\": 0.3}'",
+)
 def search(
     query: str,
     paths: list[Path],
@@ -82,21 +99,46 @@
     max_tokens: int,
     show_context: bool,
     raw: bool,
+    explain: bool,
+    weights: str | None,
 ):
     """Search the index and assemble context."""
     paths = [path.resolve() for path in paths]
 
     # Hide ChromaDB output during initialization and search
     with console.status("Initializing..."):
+        # Parse custom weights if provided
+        scoring_weights = None
+        if weights:
+            try:
+                import json
+
+                scoring_weights = json.loads(weights)
+            except json.JSONDecodeError as e:
+                console.print(f"❌ Invalid weights JSON: {e}", style="red")
+                return
+            except Exception as e:
+                console.print(f"❌ Error parsing weights: {e}", style="red")
+                return
+
        # Temporarily redirect stdout to suppress ChromaDB output
         stdout = sys.stdout
         sys.stdout = open(os.devnull, "w")
         try:
-            indexer = Indexer(persist_directory=persist_dir, enable_persist=True)
-            assembler = ContextAssembler(max_tokens=max_tokens)
-            documents, distances = indexer.search(
-                query, n_results=n_results, paths=paths
+            indexer = Indexer(
+                persist_directory=persist_dir,
+                enable_persist=True,
+                scoring_weights=scoring_weights,
             )
+            assembler = ContextAssembler(max_tokens=max_tokens)
+            if explain:
+                documents, distances, explanations = indexer.search(
+                    query, n_results=n_results, paths=paths, explain=True
+                )
+            else:
+                documents, distances, _ = indexer.search(
+                    query, n_results=n_results, paths=paths
+                )
         finally:
             sys.stdout.close()
             sys.stdout = stdout
@@ -128,20 +170,50 @@ def search(
     for i, doc in enumerate(documents):
         source = doc.metadata.get("source", "unknown")
         distance = distances[i]
-        relevance = 1 - distance  # Convert distance to similarity score
 
-        # Show document header with relevance score
-        console.print(
-            f"\n[cyan]{i+1}. {source}[/cyan] [yellow](relevance: {relevance:.2f})[/yellow]"
-        )
+        # Show document header
+        console.print(f"\n[cyan]{i+1}. {source}[/cyan]")
+
+        # Show scoring explanation if requested
+        if explain and explanations:  # Make sure explanations is not None
+            explanation = explanations[i]
+            console.print("\n[bold]Scoring Breakdown:[/bold]")
+
+            # Show individual score components
+            scores = explanation.get("scores", {})
+            for factor, score in scores.items():
+                # Color code the scores
+                if score > 0:
+                    score_color = "green"
+                    sign = "+"
+                elif score < 0:
+                    score_color = "red"
+                    sign = ""
+                else:
+                    score_color = "yellow"
+                    sign = " "
+
+                # Print score and explanation
+                console.print(
+                    f" {factor:15} [{score_color}]{sign}{score:>6.3f}[/{score_color}] | {explanation['explanations'][factor]}"
+                )
+
+            # Show total score
+            total = explanation["total_score"]
+            console.print(f"\n {'Total':15} [bold blue]{total:>7.3f}[/bold blue]")
+        else:
+            # Just show the base relevance score
+            relevance = 1 - distance
+            console.print(f"[yellow](relevance: {relevance:.2f})[/yellow]")
 
         # Use file extension as lexer (strip the dot)
         lexer = doc.metadata.get("extension", "").lstrip(".") or "text"
 
         # Extract preview content (first ~200 chars)
         preview = doc.content[:200] + ("..." if len(doc.content) > 200 else "")
 
-        # Display with syntax highlighting
+        # Display preview with syntax highlighting
+        console.print("\n[bold]Preview:[/bold]")
         syntax = Syntax(
             preview,
             lexer,
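Taken together, the cli.py changes wire the new --weights JSON string and --explain flag through to the Indexer. A rough sketch of the equivalent programmatic usage follows; the import path and persist directory are assumptions (not shown in this commit), and the explanation keys ("scores", "explanations", "total_score") are inferred from how cli.py reads them above:

import json
from pathlib import Path

from gptme_rag.indexing.indexer import Indexer  # assumed module path

weights = '{"recency_boost": 0.3}'  # same JSON format the --weights option accepts
indexer = Indexer(
    persist_directory=Path("index"),  # hypothetical location
    enable_persist=True,
    scoring_weights=json.loads(weights),
)

documents, distances, explanations = indexer.search("file watching", n_results=3, explain=True)
for doc, explanation in zip(documents, explanations):
    # Explanation keys inferred from the CLI code above.
    print(doc.metadata.get("source", "unknown"), explanation["total_score"])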

gptme_rag/indexing/document_processor.py (+21 -18)

@@ -72,42 +72,45 @@ def process_text(
                 }
                 return
 
-            # Process in chunks
+            # Process text in chunks based on tokens
             chunk_start = 0
             chunk_count = 0
 
             while chunk_start < len(tokens):
                 # Calculate chunk end
                 chunk_end = min(chunk_start + self.chunk_size, len(tokens))
 
-                # Decode chunk
+                # Get chunk tokens and decode
                 chunk_tokens = tokens[chunk_start:chunk_end]
                 chunk_text = self.encoding.decode(chunk_tokens)
 
                 # Create chunk metadata
-                chunk_metadata = {
-                    **(metadata or {}),
-                    "chunk_index": chunk_count,
-                    "token_count": len(chunk_tokens),
-                    "total_chunks": total_chunks,
-                    "chunk_start": chunk_start,
-                    "chunk_end": chunk_end,
-                }
-
                 yield {
                     "text": chunk_text,
-                    "metadata": chunk_metadata,
+                    "metadata": {
+                        **(metadata or {}),
+                        "chunk_index": chunk_count,
+                        "token_count": len(chunk_tokens),
+                        "total_chunks": total_chunks,
+                        "chunk_start": chunk_start,
+                        "chunk_end": chunk_end,
+                        "is_chunk": True,
+                    },
                 }
 
-                # Move to next chunk
-                chunk_start = chunk_end - self.chunk_overlap
+                # Calculate next chunk start
+                if chunk_end == len(tokens):
+                    # If we've reached the end, we're done
+                    break
+
+                # Move forward by at least one token, considering overlap
+                next_start = chunk_start + max(1, self.chunk_size - self.chunk_overlap)
+                chunk_start = min(next_start, len(tokens) - 1)
                 chunk_count += 1
 
-                # Check stopping conditions
+                # Check max chunks limit
                 if self.max_chunks and chunk_count >= self.max_chunks:
-                    return
-                if len(tokens) - chunk_start <= self.chunk_overlap:
-                    return
+                    break
 
         except Exception as e:
             logger.error(f"Error processing text: {e}")
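The reworked loop replaces the old chunk_start = chunk_end - self.chunk_overlap step (which could stall or move backwards when the overlap was large relative to the chunk size) with a step that always advances by at least one token. A standalone sketch of just the boundary arithmetic, as a hypothetical helper that is not part of the commit:

def chunk_bounds(n_tokens: int, chunk_size: int, chunk_overlap: int) -> list[tuple[int, int]]:
    """Return (start, end) token offsets using the stepping rule from the diff above."""
    bounds = []
    chunk_start = 0
    while chunk_start < n_tokens:
        chunk_end = min(chunk_start + chunk_size, n_tokens)
        bounds.append((chunk_start, chunk_end))
        if chunk_end == n_tokens:
            break
        # Advance by at least one token while keeping chunk_overlap tokens of overlap.
        next_start = chunk_start + max(1, chunk_size - chunk_overlap)
        chunk_start = min(next_start, n_tokens - 1)
    return bounds

# For example, chunk_bounds(10, 4, 2) yields [(0, 4), (2, 6), (4, 8), (6, 10)].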
