-
Notifications
You must be signed in to change notification settings - Fork 4
/
Copy pathcreate_knowledge_base.py
37 lines (25 loc) · 1 KB
/
create_knowledge_base.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
#!/usr/bin/env python3
import argparse
from pathlib import Path
from dotenv import load_dotenv
from knowledge_base import KnowledgeBase
def main() -> None:
    """Build a knowledge base from a directory of documents and persist it.

    Calls ``load_dotenv()`` first (presumably so settings from a ``.env``
    file are available to the knowledge-base code -- confirm against
    ``knowledge_base``), then parses a single positional command-line
    argument, ``directory``. The knowledge base is built with
    ``KnowledgeBase.from_directory`` and written with ``persist`` to a
    ``vector_store`` directory located next to this script.

    Raises:
        SystemExit: If the command-line arguments are invalid (raised by
            ``argparse``), or if ``directory`` does not exist or is not a
            directory. In the latter cases the message is written to stderr
            and the process exit status is 1.
    """
    load_dotenv()

    parser = argparse.ArgumentParser(
        description="Create a knowledge base from a directory of documents"
    )
    parser.add_argument(
        "directory", type=str, help="Directory containing documents to index"
    )
    args = parser.parse_args()

    # Validate the input path up front. Raising SystemExit with a string
    # prints it to stderr and exits with status 1, so shell callers can
    # detect the failure (a plain ``return`` would exit with status 0).
    input_dir = Path(args.directory)
    if not input_dir.exists():
        raise SystemExit(f"Error: Directory '{input_dir}' does not exist")
    if not input_dir.is_dir():
        # ``exists()`` alone would let a regular file through.
        raise SystemExit(f"Error: '{input_dir}' is not a directory")

    # The vector store lives alongside this script; create it on first run.
    output_dir = Path(__file__).parent / "vector_store"
    output_dir.mkdir(exist_ok=True)

    print(f"Creating knowledge base from {input_dir} ...")
    kb = KnowledgeBase.from_directory(str(input_dir))

    print(f"Persisting knowledge base to {output_dir} ...")
    kb.persist(str(output_dir))

    print("Done!")
# Run main() only when this file is executed as a script, not when imported.
if __name__ == "__main__":
    main()