{"id":22410868,"url":"https://github.com/runtime-error786/parent-document-retriever","last_synced_at":"2026-05-10T16:02:25.824Z","repository":{"id":254582675,"uuid":"846971536","full_name":"runtime-error786/Parent-Document-Retriever","owner":"runtime-error786","description":null,"archived":false,"fork":false,"pushed_at":"2024-08-24T13:38:28.000Z","size":658,"stargazers_count":2,"open_issues_count":0,"forks_count":0,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-06-25T02:44:14.851Z","etag":null,"topics":["huggingface-transformers","langchain","llama3-meta-ai"],"latest_commit_sha":null,"homepage":"","language":"Jupyter Notebook","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/runtime-error786.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2024-08-24T13:34:04.000Z","updated_at":"2025-04-25T02:34:20.000Z","dependencies_parsed_at":"2024-08-24T14:57:51.037Z","dependency_job_id":null,"html_url":"https://github.com/runtime-error786/Parent-Document-Retriever","commit_stats":null,"previous_names":["runtime-error786/parent-document-retriever"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/runtime-error786/Parent-Document-Retriever","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runtime-error786%2FParent-Document-Retriever","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runtime-error786%2FParent-Document-Retriever/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runtime-error786%2FParent-Document-Retriever/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runtime-error786%2FParent-Document-Retriever/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/runtime-error786","download_url":"https://codeload.github.com/runtime-error786/Parent-Document-Retriever/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runtime-error786%2FParent-Document-Retriever/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":274195497,"owners_count":25239147,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-09-08T02:00:09.813Z","response_time":121,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["huggingface-transformers","langchain","llama3-meta-ai"],"created_at":"2024-12-05T13:11:56.273Z","updated_at":"2026-05-10T16:02:20.783Z","avatar_url":"https://github.com/runtime-error786.png","language":"Jupyter Notebook","funding_links":[],"categories":[],"sub_categories":[],"readme":"# Parent Document Retriever\n\nThis project demonstrates how to load, process, and retrieve information from PDF documents using LangChain. The script processes PDF files, splits them into chunks, embeds the text, and enables question-answering (QA) capabilities through a retrieval system.\n\n## Features\n\n- **PDF Document Loading**: Load and process PDF documents from a specified folder.\n- **Text Splitting**: Break down large documents into smaller chunks for efficient processing.\n- **Embedding**: Use HuggingFace's sentence transformer model to embed document chunks.\n- **Vector Store**: Store the embedded chunks in a vector store (Chroma) for efficient retrieval.\n- **Retrieval System**: Retrieve relevant information from documents using LangChain's ParentDocumentRetriever.\n- **Question Answering**: Perform QA on the documents using the Ollama language model.\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fruntime-error786%2Fparent-document-retriever","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fruntime-error786%2Fparent-document-retriever","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fruntime-error786%2Fparent-document-retriever/lists"}