diff --git a/.gitignore b/.gitignore
index e41eca8..1f7f108 100644
--- a/.gitignore
+++ b/.gitignore
@@ -11,7 +11,11 @@ venv/
 # Generated
 embeddings.json
 
+# Vector database storage
+chroma_db/
+
 # Package build artifacts
 *.egg-info/
 dist/
 build/
+*.dist-info/
diff --git a/README.md b/README.md
index 36fcda1..d86deff 100644
--- a/README.md
+++ b/README.md
@@ -10,10 +10,18 @@ A progressive RAG system built from first principles -- from raw embeddings and
 <tr>
 <td valign="top" width="55%">
 
-1. **Chunks** text documents into overlapping word windows so meaning is preserved at boundaries
-2. **Embeds** each chunk using the OpenAI `text-embedding-3-small` API, producing a 1536-dimensional vector per chunk
-3. **Stores** vectors alongside the original text in a local `embeddings.json` file
-4. **Searches** by embedding a natural language query using the same model, then ranking all chunks by cosine similarity and returning the top-K matches
+Ingestion
+
+1. **Loads** `.txt` files (PDF, DOCX, and Markdown support is planned for Phase 4)
+2. **Chunks** each document into overlapping word windows
+3. **Embeds** each chunk using OpenAI `text-embedding-3-small`, producing a 1536-dimensional vector
+4. **Stores** vectors with metadata (`source`, `chunk_index`) in a persistent Chroma collection
+
+Search
+
+1. **Embeds** the query using the same model
+2. **Queries** Chroma for the top-K nearest vectors using built-in ANN (Approximate Nearest Neighbor) search
+3. **Returns** results with chunk text, source filename, and distance score
 
 </td>
 <td valign="top" width="45%">
@@ -30,8 +38,7 @@ A progressive RAG system built from first principles -- from raw embeddings and
 
 - Python 3.12
 - OpenAI SDK (`text-embedding-3-small`)
-- NumPy (cosine similarity)
-- Plain JSON (storage -- current phase)
+- Chroma (persistent vector database)
 - python-dotenv
 
 ---
@@ -40,19 +47,23 @@ A progressive RAG system built from first principles -- from raw embeddings and
 
 ```text
 rag-document-engine/
-├── documents/              # Sample .txt files to embed
+├── documents/                  # Sample .txt files
 │   ├── ancient-rome.txt
 │   ├── climate-change.txt
 │   ├── music-and-the-brain.txt
 │   ├── nutrition-and-health.txt
 │   └── space-exploration.txt
-├── embed.py                # Load, chunk, embed documents -> embeddings.json
-├── search.py               # Embed query + retrieve top-K chunks by cosine similarity
-├── utils.py                # chunk_text and cosine_similarity helpers
+├── embed.py                    # embed_chunks and embed_query utilities
+├── ingest.py                   # Load, chunk, embed, store in Chroma
+├── search.py                   # Embed query + retrieve top-K from Chroma
+├── inspect_collection.py       # Print collection stats and a sample entry
+├── utils.py                    # chunk_text, load_document, load_documents
+├── chroma_db/                  # Chroma persistent storage (not committed)
+├── diagrams/                   # Pipeline diagrams
 ├── docs/
 │   └── implementation-plan.md  # Phase-by-phase build plan
 ├── pyproject.toml
-└── .env                    # API keys (not committed)
+└── .env                        # API keys (not committed)
 ```
 
 ---
@@ -77,11 +88,14 @@ EMBEDDING_MODEL=text-embedding-3-small
 ## Usage
 
 ```bash
-# Step 1 -- Embed all documents (generates embeddings.json)
-python3 embed.py
+# Step 1 -- Ingest documents into Chroma
+python3 ingest.py
 
 # Step 2 -- Search
 python3 search.py
+
+# Inspect the collection
+python3 inspect_collection.py
 ```
 
 The query is set in `search.py` main. Change it to anything you want to search for.
@@ -93,22 +107,23 @@ The query is set in `search.py` main. Change it to anything you want to search f
 Query: `"what foods are good for the heart"`
 
 ```text
-Result 1 (score: 0.3571)
-Nutrition is the science of how food affects the body. The food we eat provides energy and
-the raw materials needed to build and repair tissues... Unsaturated fats found in olive oil,
+Result 1 (distance: 1.2862) -- nutrition-and-health.txt [chunk 0]
+Nutrition is the science of how food affects the body... Unsaturated fats found in olive oil,
 nuts, avocados, and fatty fish are associated with reduced risk of heart disease...
 
-Result 2 (score: 0.3143)
+Result 2 (distance: 1.3720) -- nutrition-and-health.txt [chunk 1]
 The Mediterranean diet -- rich in vegetables, fruit, whole grains, fish, and olive oil -- is
 consistently associated with lower rates of heart disease, diabetes, and cognitive decline...
 
-Result 3 (score: 0.1786)
+Result 3 (distance: 1.6426) -- music-and-the-brain.txt [chunk 1]
 Music also affects mood and stress. Slow, quiet music activates the parasympathetic nervous
 system, lowering heart rate and cortisol levels...
 ```
 
 The top two results come from the nutrition document. Result 3 surfaces from the music document because it mentions "heart rate" -- semantic search catches conceptual overlap, not just keyword matches.
 
+Note: distance is Chroma's default squared L2 distance, not a similarity score -- lower means more relevant.
+
 ---
 
 ## Progress
@@ -116,7 +131,7 @@ The top two results come from the nutrition document. Result 3 surfaces from the
 | Phase | Title | Status |
 | ----: | ----- | ------ |
 | 1 | Semantic Foundation | Complete |
-| 2 | Vector Store | In Progress |
+| 2 | Vector Store | Complete |
 | 3 | RAG Pipeline | Planned |
 | 4 | Document Ingestion | Planned |
 | 5 | Retrieval Quality | Planned |
@@ -133,10 +148,11 @@ See [docs/implementation-plan.md](./docs/implementation-plan.md) for full phase
 - **Cosine similarity** -- measures the angle between vectors; direction encodes meaning, magnitude does not
 - **Chunking** -- splits documents into overlapping windows so meaning is not diluted or cut at boundaries
 - **Model consistency** -- the same embedding model must be used for both documents and queries
+- **Vector database** -- stores embeddings with metadata and retrieves them by similarity using ANN search
 - **RAG** -- Retrieval-Augmented Generation: retrieve relevant context, then generate a grounded answer
 
 ---
 
 ## Diagrams
 
-The pipeline diagram is maintained as a PlantUML source file (`pipeline.puml`) and auto-exported to SVG on every push to main using [diagram-sync](https://www.npmjs.com/package/diagram-sync).
+Pipeline diagrams are maintained as PlantUML source files in `diagrams/` and auto-exported to SVG on every push to main using [diagram-sync](https://www.npmjs.com/package/diagram-sync).
diff --git a/diagrams/pipeline.puml b/diagrams/pipeline.puml
new file mode 100644
index 0000000..98d320e
--- /dev/null
+++ b/diagrams/pipeline.puml
@@ -0,0 +1,60 @@
+@startuml pipeline-phase2
+
+skinparam backgroundColor #FFFFFF
+skinparam defaultFontName Arial
+skinparam defaultFontSize 13
+skinparam ArrowColor #555555
+skinparam componentStyle rectangle
+
+skinparam component {
+  BackgroundColor #EEF3FB
+  BorderColor #5577AA
+  FontColor #222222
+}
+
+skinparam database {
+  BackgroundColor #FFF8E7
+  BorderColor #CC9900
+}
+
+skinparam cloud {
+  BackgroundColor #F0FFF0
+  BorderColor #448844
+}
+
+title Phase 2 -- Chroma Vector Store Pipeline
+
+package "Ingestion (ingest.py)" {
+  [.txt files] as docs
+  [load_documents()] as load
+  [chunk_text()] as chunk
+  [embed_chunks()] as embed
+}
+
+cloud "OpenAI API\ntext-embedding-3-small" as openai
+
+database "Chroma DB\n(persistent)" as chroma
+
+package "Search (search.py)" {
+  [Query] as query
+  [embed_query()] as embedq
+  [collection.query()] as cquery
+  [Top-K Results\n(text + source + distance)] as results
+}
+
+docs --> load
+load --> chunk
+chunk --> embed
+embed --> openai : API call
+openai --> embed : 1536-dim vectors
+embed --> chroma : upsert with\nids + metadata
+
+query --> embedq
+embedq --> openai : API call
+openai --> embedq : query vector
+embedq --> cquery
+cquery --> chroma : ANN search
+chroma --> cquery : nearest vectors
+cquery --> results
+
+@enduml
diff --git a/diagrams/pipeline.svg b/diagrams/pipeline.svg
deleted file mode 100644
index aacf16b..0000000
--- a/diagrams/pipeline.svg
+++ /dev/null
@@ -1,80 +0,0 @@
-<?xml version="1.0" encoding="UTF-8" standalone="no"?><svg xmlns="http://www.w3.org/2000/svg" xmlns:xlink="http://www.w3.org/1999/xlink" contentScriptType="application/ecmascript" contentStyleType="text/css" height="668px" preserveAspectRatio="none" style="width:425px;height:668px;background:#FAFAFA;" version="1.1" viewBox="0 0 425 668" width="425px" zoomAndPan="magnify"><defs><filter height="300%" id="ft2u3n2i3ka5f" width="300%" x="-1" y="-1"><feGaussianBlur result="blurOut" stdDeviation="2.0"/><feColorMatrix in="blurOut" result="blurOut2" type="matrix" values="0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 0 .4 0"/><feOffset dx="4.0" dy="4.0" in="blurOut2" result="blurOut3"/><feBlend in="SourceGraphic" in2="blurOut3" mode="normal"/></filter></defs><g><!--MD5=[ff4c7cbfc86cbafc5088fc7dc3b82e86]
-cluster Indexing — embed.py--><polygon fill="#EEF2FF" filter="url(#ft2u3n2i3ka5f)" points="22,24,189,24,196,45.1328,218,45.1328,218,454,22,454,22,24" style="stroke: #000000; stroke-width: 1.5;"/><line style="stroke: #000000; stroke-width: 1.5;" x1="22" x2="196" y1="45.1328" y2="45.1328"/><text fill="#000000" font-family="Arial" font-size="13" font-weight="bold" lengthAdjust="spacingAndGlyphs" textLength="161" x="26" y="38.0669">Indexing — embed.py</text><!--MD5=[b7354f1b6b1a4ce6b3292a1a387e6ba1]
-cluster Search — search.py--><polygon fill="#FDF4FF" filter="url(#ft2u3n2i3ka5f)" points="242,258.5,393,258.5,400,279.6328,403,279.6328,403,656,242,656,242,258.5" style="stroke: #000000; stroke-width: 1.5;"/><line style="stroke: #000000; stroke-width: 1.5;" x1="242" x2="400" y1="279.6328" y2="279.6328"/><text fill="#000000" font-family="Arial" font-size="13" font-weight="bold" lengthAdjust="spacingAndGlyphs" textLength="145" x="246" y="272.5669">Search — search.py</text><!--MD5=[57a5b41ed6b3ba96fe9b4a740eb3fdc7]
-entity docs--><polygon fill="#FEFECE" filter="url(#ft2u3n2i3ka5f)" points="67,58,113,58,120,79,173,79,173,111.2656,67,111.2656,67,58" style="stroke: #000000; stroke-width: 1.5;"/><line style="stroke: #000000; stroke-width: 1.5;" x1="67" x2="120" y1="79" y2="79"/><text fill="#000000" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="76" x="77" y="98.0669">documents/</text><!--MD5=[ff858b2fa29ed35ae3d882895b3a15f0]
-entity chunk--><rect fill="#EFF6FF" filter="url(#ft2u3n2i3ka5f)" height="50.2656" rx="6" ry="6" style="stroke: #3B82F6; stroke-width: 1.5;" width="164" x="38" y="171"/><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="70" x="48" y="193.0669">chunk_text</text><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="144" x="48" y="208.1997">300 words · 50 overlap</text><!--MD5=[1a7a766028402bec58ce31452d7a7648]
-entity embed--><rect fill="#EFF6FF" filter="url(#ft2u3n2i3ka5f)" height="50.2656" rx="6" ry="6" style="stroke: #3B82F6; stroke-width: 1.5;" width="117" x="65.5" y="281"/><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="97" x="75.5" y="303.0669">embed_chunks</text><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="70" x="75.5" y="318.1997">OpenAI API</text><!--MD5=[0686720d71d32ea68f81164171d509ce]
-entity store--><path d="M67.5,404 C67.5,394 132,394 132,394 C132,394 196.5,394 196.5,404 L196.5,428.1328 C196.5,438.1328 132,438.1328 132,438.1328 C132,438.1328 67.5,438.1328 67.5,428.1328 L67.5,404 " fill="#FEF9C3" filter="url(#ft2u3n2i3ka5f)" style="stroke: #EAB308; stroke-width: 1.5;"/><path d="M67.5,404 C67.5,414 132,414 132,414 C132,414 196.5,414 196.5,404 " fill="none" style="stroke: #EAB308; stroke-width: 1.5;"/><text fill="#713F12" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="109" x="77.5" y="430.0669">embeddings.json</text><ellipse cx="320.8701" cy="306.2005" fill="#F0FDF4" filter="url(#ft2u3n2i3ka5f)" rx="29.8701" ry="13.7005" style="stroke: #22C55E; stroke-width: 1.5;"/><text fill="#14532D" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="38" x="301.8701" y="310.2669">Query</text><!--MD5=[81edeb3f3a35c1dab7f46e9decfdfebe]
-entity embedq--><rect fill="#EFF6FF" filter="url(#ft2u3n2i3ka5f)" height="50.2656" rx="6" ry="6" style="stroke: #3B82F6; stroke-width: 1.5;" width="108" x="267" y="391"/><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="88" x="277" y="413.0669">embed_query</text><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="70" x="277" y="428.1997">OpenAI API</text><!--MD5=[3db17c234f6b9cf849b9b762d4cff762]
-entity cosine--><rect fill="#EFF6FF" filter="url(#ft2u3n2i3ka5f)" height="50.2656" rx="6" ry="6" style="stroke: #3B82F6; stroke-width: 1.5;" width="125" x="258.5" y="501"/><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="105" x="268.5" y="523.0669">cosine_similarity</text><text fill="#1E3A8A" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="81" x="268.5" y="538.1997">vs all chunks</text><ellipse cx="320.7736" cy="625.4547" fill="#F0FDF4" filter="url(#ft2u3n2i3ka5f)" rx="60.2736" ry="14.4547" style="stroke: #22C55E; stroke-width: 1.5;"/><text fill="#14532D" font-family="Arial" font-size="13" lengthAdjust="spacingAndGlyphs" textLength="86" x="277.7736" y="629.5211">Top-K Results</text><!--MD5=[58d0584bf00a192df52be675af4060c3]
-link docs to chunk--><path d="M120,111.21 C120,111.21 120,165.66 120,165.66 " fill="none" id="docs-&gt;chunk" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="120,170.66,124,161.66,120,165.66,116,161.66,120,170.66" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[f719c65e3cd5877eb9f397b030baf6d1]
-link chunk to embed--><path d="M124,221.24 C124,221.24 124,275.88 124,275.88 " fill="none" id="chunk-&gt;embed" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="124,280.88,128,271.88,124,275.88,120,271.88,124,280.88" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[3fff7060fd0c4e8b3dcde3a0a24b4cc6]
-link embed to store--><path d="M125,331.24 C125,331.24 125,388.86 125,388.86 " fill="none" id="embed-&gt;store" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="125,393.86,129,384.86,125,388.86,121,384.86,125,393.86" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[8efdc581dcc4934b230519e9a1c62620]
-link query to embedq--><path d="M321,319.93 C321,319.93 321,385.88 321,385.88 " fill="none" id="query-&gt;embedq" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="321,390.88,325,381.88,321,385.88,317,381.88,321,390.88" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[07d0e59a576869aa907c1b73aa635231]
-link embedq to cosine--><path d="M321,441.24 C321,441.24 321,495.88 321,495.88 " fill="none" id="embedq-&gt;cosine" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="321,500.88,325,491.88,321,495.88,317,491.88,321,500.88" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[4684471f6051558c3413dfb8791f28b5]
-link cosine to results--><path d="M321,551.11 C321,551.11 321,605.9 321,605.9 " fill="none" id="cosine-&gt;results" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="321,610.9,325,601.9,321,605.9,317,601.9,321,610.9" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[a0c1a4ea2fae617c4a25a3db61a81add]
-link store to cosine--><path d="M196.61,416 C229.55,416 262.75,416 262.75,416 C262.75,416 262.75,495.76 262.75,495.76 " fill="none" id="store-&gt;cosine" style="stroke: #555555; stroke-width: 2.0;"/><polygon fill="#555555" points="262.75,500.76,266.75,491.76,262.75,495.76,258.75,491.76,262.75,500.76" style="stroke: #555555; stroke-width: 2.0;"/><!--MD5=[b5895bd08e5963fd690290115f3d9b71]
-@startuml pipeline
-skinparam direction left to right
-skinparam backgroundColor #FAFAFA
-skinparam defaultFontName Arial
-skinparam defaultFontSize 13
-skinparam ArrowColor #555555
-skinparam ArrowThickness 2
-skinparam linetype ortho
-
-skinparam rectangle {
-    BackgroundColor #EFF6FF
-    BorderColor #3B82F6
-    FontColor #1E3A8A
-    RoundCorner 12
-}
-
-skinparam database {
-    BackgroundColor #FEF9C3
-    BorderColor #EAB308
-    FontColor #713F12
-}
-
-skinparam usecase {
-    BackgroundColor #F0FDF4
-    BorderColor #22C55E
-    FontColor #14532D
-}
-
-package "Indexing — embed.py" #EEF2FF {
-    folder "documents/" as docs
-    rectangle "chunk_text\n300 words · 50 overlap" as chunk
-    rectangle "embed_chunks\nOpenAI API" as embed
-    database "embeddings.json" as store
-
-    docs - -> chunk
-    chunk - -> embed
-    embed - -> store
-}
-
-package "Search — search.py" #FDF4FF {
-    usecase "Query" as query
-    rectangle "embed_query\nOpenAI API" as embedq
-    rectangle "cosine_similarity\nvs all chunks" as cosine
-    usecase "Top-K Results" as results
-
-    query - -> embedq
-    embedq - -> cosine
-    cosine - -> results
-}
-
-store - -> cosine
-
-@enduml
-
-PlantUML version 1.2020.02(Sun Mar 01 10:22:07 UTC 2020)
-(GPL source distribution)
-Java Runtime: OpenJDK Runtime Environment
-JVM: OpenJDK 64-Bit Server VM
-Java Version: 17.0.19+10
-Operating System: Linux
-Default Encoding: UTF-8
-Language: en
-Country: null
---></g></svg>
\ No newline at end of file
diff --git a/docs/implementation-plan.md b/docs/implementation-plan.md
index 974b663..d96f3ca 100644
--- a/docs/implementation-plan.md
+++ b/docs/implementation-plan.md
@@ -58,7 +58,7 @@ The chunking and embedding logic from Phase 1 carries over unchanged. The only t
 
 - `chromadb` -- local persistent vector database
 
-**Status:** In Progress
+**Status:** Complete
 
 **Vector DB tradeoffs to understand:**
 
diff --git a/embed.py b/embed.py
index e6cd6c7..47ac3f6 100644
--- a/embed.py
+++ b/embed.py
@@ -1,7 +1,5 @@
 from openai import OpenAI
 from dotenv import load_dotenv
-from utils import chunk_text
-import json
 import os
 
 load_dotenv()
@@ -14,32 +12,8 @@ def embed_chunks(chunks: list[str]) -> list[dict]:
         model=os.getenv("EMBEDDING_MODEL"),
         input=chunks
     )
-
     return [{"text": chunk, "embedding": response.data[i].embedding} for i, chunk in enumerate(chunks)]
 
+
 def embed_query(query: str) -> list[float]:
     return embed_chunks([query])[0]["embedding"]
-
-def load_document(filepath: str) -> str:
-    try:
-        with open(filepath, 'r') as f:
-            return f.read()
-    except FileNotFoundError as e:
-        raise FileNotFoundError(f"Document not found: {filepath}: {e}")
-
-def response_write(filepath: str, embeddings: list[dict]) -> bool:
-    try:
-        with open(filepath, 'w') as f:
-            json.dump(embeddings, f)
-    except IOError as e:
-        raise IOError(f"Failed to wrte embeddings: {e}")
-
-def main():
-    file_names = os.listdir("documents/")
-    json_response = []
-    for file_name in filter(lambda f: f.endswith('.txt'), file_names):
-        json_response.extend(embed_chunks(chunk_text(load_document(f"documents/{file_name}"))))
-    response_write("embeddings.json", json_response)
-
-if __name__ == '__main__':
-    main()
\ No newline at end of file
diff --git a/ingest.py b/ingest.py
new file mode 100644
index 0000000..1952dc0
--- /dev/null
+++ b/ingest.py
@@ -0,0 +1,46 @@
+from utils import chunk_text, load_documents
+from embed import embed_chunks
+import chromadb
+
+client = chromadb.PersistentClient(path="./chroma_db")
+
+
+def main():
+    """Chunk, embed, and store every document found in ``documents/``.
+
+    Each chunk is upserted under the id ``<filename>_<chunk_index>`` with
+    ``source`` and ``chunk_index`` metadata. Chunks already stored for a
+    source are deleted first, so re-running the script replaces that
+    document's chunks instead of leaving stale ones behind.
+    """
+    collection = client.get_or_create_collection(name="documents")
+
+    for doc in load_documents("documents/"):
+        source = doc["filename"]
+        chunks = chunk_text(doc["text"])
+        # Embed before touching the collection so a failed API call leaves the
+        # previously ingested chunks in place. A document that yields no chunks
+        # is never sent to the embedding API.
+        embedded = embed_chunks(chunks) if chunks else []
+
+        # Delete existing chunks for this source before re-ingesting
+        if collection.count() > 0:
+            collection.delete(where={"source": source})
+
+        if not chunks:
+            print(f"Skipped {source}: no chunks to ingest")
+            continue
+
+        collection.upsert(
+            ids=[f"{source}_{i}" for i in range(len(chunks))],
+            embeddings=[e["embedding"] for e in embedded],
+            documents=chunks,
+            metadatas=[{"source": source, "chunk_index": i} for i in range(len(chunks))],
+        )
+
+        print(f"Ingested {len(chunks)} chunks from {source}")
+
+    print(f"\nTotal vectors in collection: {collection.count()}")
+
+if __name__ == '__main__':
+    main()
diff --git a/inspect_collection.py b/inspect_collection.py
new file mode 100644
index 0000000..70c4f36
--- /dev/null
+++ b/inspect_collection.py
@@ -0,0 +1,39 @@
+import chromadb
+
+client = chromadb.PersistentClient(path="./chroma_db")
+
+
+def main():
+    """Print the collection's vector count and one sample entry.
+
+    The sample shows the stored id, the ``source`` and ``chunk_index``
+    metadata, the first 120 characters of the chunk text, and the first two
+    embedding values together with the embedding's length.
+    """
+    collection = client.get_or_create_collection(name="documents")
+    total = collection.count()
+
+    print(f"Total vectors in collection: {total}\n")
+
+    # An empty collection has no entry to sample; indexing the empty result
+    # lists below would raise IndexError.
+    if total == 0:
+        print("Collection is empty -- run ingest.py first.")
+        return
+
+    sample = collection.get(
+        limit=1,
+        include=["documents", "metadatas", "embeddings"],
+    )
+    embedding = sample["embeddings"][0]
+
+    print("Sample entry:")
+    print(f"  id:          {sample['ids'][0]}")
+    print(f"  source:      {sample['metadatas'][0]['source']}")
+    print(f"  chunk_index: {sample['metadatas'][0]['chunk_index']}")
+    print(f"  text:        {sample['documents'][0][:120]}...")
+    print(f"  embedding:   [{embedding[0]:.6f}, {embedding[1]:.6f}, ...] ({len(embedding)} dims)")
+
+
+if __name__ == '__main__':
+    main()
diff --git a/pyproject.toml b/pyproject.toml
index 2481e7a..0b9e40b 100644
--- a/pyproject.toml
+++ b/pyproject.toml
@@ -6,6 +6,7 @@ dependencies = [
     "openai>=1.0.0",
     "python-dotenv>=1.0.0",
     "numpy>=1.26.0",
+    "chromadb>=1.5.9"
 ]
 
 [tool.setuptools]
diff --git a/search.py b/search.py
index 674a4ca..8e94815 100644
--- a/search.py
+++ b/search.py
@@ -1,31 +1,56 @@
-import json
-from utils import chunk_text, cosine_similarity
-from embed import embed_chunks, embed_query
+from embed import embed_query
+import chromadb
+
+client = chromadb.PersistentClient(path="./chroma_db")
 
-def load_embedded_response() -> list[dict]:
-    try:
-        with open('embeddings.json', 'r') as f:
-            return json.load(f)
-    except FileNotFoundError as e:
-        raise FileNotFoundError(f"File not found") 
 
 def search(query: str, top_k: int = 3) -> list[dict]:
-    embedded_response = load_embedded_response()
+    """Return up to ``top_k`` stored chunks nearest to ``query``.
+
+    The query is embedded with ``embed_query`` and matched against the
+    ``documents`` Chroma collection.
+
+    Returns:
+        One dict per hit, in the order Chroma returns them, with the keys
+        ``text``, ``source``, ``chunk_index`` and ``distance``.
+    """
+    collection = client.get_or_create_collection(name="documents")
     query_vector = embed_query(query)
 
-    scored = [
-        {"text": chunk["text"], "score": cosine_similarity(query_vector, chunk["embedding"])}
-        for chunk in embedded_response
+    results = collection.query(
+        query_embeddings=[query_vector],
+        n_results=top_k,
+        include=["documents", "metadatas", "distances"],
+    )
+
+    # Chroma returns one result list per query embedding; only one was sent,
+    # so index 0 holds the hits for this query.
+    texts = results["documents"][0]
+    metadatas = results["metadatas"][0]
+    distances = results["distances"][0]
+
+    return [
+        {
+            "text": text,
+            "source": metadata["source"],
+            "chunk_index": metadata["chunk_index"],
+            "distance": distance,
+        }
+        for text, metadata, distance in zip(texts, metadatas, distances)
     ]
 
-    return sorted(scored, key = lambda x: x["score"], reverse = True)[:top_k]
 
 def main():
-    results = search("what foods are good for the heart")
+    """Run a sample query and print each hit with its distance and source."""
+    query = "what foods are good for the heart"
+    results = search(query)
+
+    print(f"Query: \"{query}\"\n")
     for i, result in enumerate(results):
-        print(f"Result {i + 1} (score: {result['score']:.4f})")
+        print(f"Result {i + 1} (distance: {result['distance']:.4f}) — {result['source']} [chunk {result['chunk_index']}]")
         print(result["text"])
         print()
 
+
 if __name__ == '__main__':
     main()
diff --git a/utils.py b/utils.py
index bc082b2..a04b3d4 100644
--- a/utils.py
+++ b/utils.py
@@ -1,5 +1,39 @@
+import os
+
 import numpy as np
 
+
+def load_document(filepath: str) -> str:
+    """Return the full text of the file at ``filepath``.
+
+    The file is decoded as UTF-8 rather than the platform's default
+    encoding, so the same document reads identically on every system.
+
+    Raises:
+        FileNotFoundError: If ``filepath`` does not exist.
+    """
+    try:
+        with open(filepath, 'r', encoding='utf-8') as f:
+            return f.read()
+    except FileNotFoundError as e:
+        raise FileNotFoundError(f"Document not found: {filepath}: {e}") from e
+
+
+def load_documents(directory: str) -> list[dict]:
+    """Load every ``.txt`` file directly inside ``directory``.
+
+    Filenames are sorted so repeated runs process the documents in the same
+    order; ``os.listdir`` returns entries in arbitrary order.
+
+    Returns:
+        One ``{"filename": ..., "text": ...}`` dict per file.
+    """
+    filenames = sorted(f for f in os.listdir(directory) if f.endswith('.txt'))
+    return [
+        {"filename": filename, "text": load_document(os.path.join(directory, filename))}
+        for filename in filenames
+    ]
+
 def chunk_text(text: str, chunk_size: int = 300, overlap: int = 50) -> list[str]:
     words = text.split()
     step = chunk_size - overlap