diff --git a/src/code_rag/__pycache__/__init__.cpython-313.pyc b/src/code_rag/__pycache__/__init__.cpython-313.pyc deleted file mode 100644 index d930f3d..0000000 Binary files a/src/code_rag/__pycache__/__init__.cpython-313.pyc and /dev/null differ diff --git a/src/code_rag/__pycache__/doc_tracker.cpython-313.pyc b/src/code_rag/__pycache__/doc_tracker.cpython-313.pyc deleted file mode 100644 index 60978c7..0000000 Binary files a/src/code_rag/__pycache__/doc_tracker.cpython-313.pyc and /dev/null differ diff --git a/src/code_rag/__pycache__/rag.cpython-313.pyc b/src/code_rag/__pycache__/rag.cpython-313.pyc deleted file mode 100644 index 490123b..0000000 Binary files a/src/code_rag/__pycache__/rag.cpython-313.pyc and /dev/null differ diff --git a/src/code_rag/rag.py b/src/code_rag/rag.py index 74dd36c..4e5f23f 100644 --- a/src/code_rag/rag.py +++ b/src/code_rag/rag.py @@ -160,9 +160,7 @@ class RAG: # 3. Process new and modified documents files_to_process = changed_files["new"] + changed_files["modified"] if files_to_process: - chunks, _ = self.process_documents( - files_to_process, text_splitter, self.tracker - ) + chunks, _ = self.process_documents(files_to_process, text_splitter) print(f"Adding {len(chunks)} new chunks to the vector store") vectorstore.add_documents(chunks) else: diff --git a/tests/__pycache__/__init__.cpython-313.pyc b/tests/__pycache__/__init__.cpython-313.pyc deleted file mode 100644 index 0046516..0000000 Binary files a/tests/__pycache__/__init__.cpython-313.pyc and /dev/null differ diff --git a/tests/__pycache__/fixtures.cpython-313.pyc b/tests/__pycache__/fixtures.cpython-313.pyc deleted file mode 100644 index 6ab0623..0000000 Binary files a/tests/__pycache__/fixtures.cpython-313.pyc and /dev/null differ diff --git a/tests/__pycache__/test_doc_tracker.cpython-313-pytest-8.3.5.pyc b/tests/__pycache__/test_doc_tracker.cpython-313-pytest-8.3.5.pyc deleted file mode 100644 index 78d2814..0000000 Binary files a/tests/__pycache__/test_doc_tracker.cpython-313-pytest-8.3.5.pyc and /dev/null differ diff --git a/tests/__pycache__/test_rag.cpython-313-pytest-8.3.5.pyc b/tests/__pycache__/test_rag.cpython-313-pytest-8.3.5.pyc deleted file mode 100644 index 9ce9147..0000000 Binary files a/tests/__pycache__/test_rag.cpython-313-pytest-8.3.5.pyc and /dev/null differ diff --git a/tests/__pycache__/utility.cpython-313.pyc b/tests/__pycache__/utility.cpython-313.pyc deleted file mode 100644 index c57fb38..0000000 Binary files a/tests/__pycache__/utility.cpython-313.pyc and /dev/null differ diff --git a/tests/test_rag.py b/tests/test_rag.py index 6c09d49..e96957f 100644 --- a/tests/test_rag.py +++ b/tests/test_rag.py @@ -23,6 +23,7 @@ def test_process_documents(tracker_file, docs_dir, db_dir, sample_docs, rag_pipe files = [ os.path.join(rag_pipeline.docs_dir, "doc1.txt"), os.path.join(rag_pipeline.docs_dir, "doc2.txt"), + os.path.join(rag_pipeline.docs_dir, "doc3.txt"), ] text_splitter = RecursiveCharacterTextSplitter(chunk_size=1000, chunk_overlap=200) @@ -30,13 +31,12 @@ def test_process_documents(tracker_file, docs_dir, db_dir, sample_docs, rag_pipe chunks, file_chunk_map = rag_pipeline.process_documents(files, text_splitter) # Verify chunks were created - assert len(chunks) >= 2 # At least one chunk per document + assert len(chunks) >= 3 # At least one chunk per document tracker = rag_pipeline.tracker # Verify chunk IDs were tracked for file_path in files: assert file_path in tracker.doc_info - assert "chunk_ids" in tracker.doc_info[file_path] - assert len(tracker.doc_info[file_path]["chunk_ids"]) > 0 + assert len(tracker.doc_info[file_path].chunk_ids) > 0 # Verify metadata in chunks for chunk in chunks: