{"id":21715248,"url":"https://github.com/davidwrossiter/langchunk","last_synced_at":"2025-03-20T19:26:57.557Z","repository":{"id":244834384,"uuid":"816406763","full_name":"davidwrossiter/langchunk","owner":"davidwrossiter","description":"Source code for chunking code in multiple different languages","archived":false,"fork":false,"pushed_at":"2024-06-20T14:20:07.000Z","size":6587,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-03-14T22:35:13.570Z","etag":null,"topics":["chunking","chunking-algorithm","embedding","llm-context","vectorization"],"latest_commit_sha":null,"homepage":"","language":"JavaScript","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/davidwrossiter.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2024-06-17T17:26:06.000Z","updated_at":"2024-06-18T11:19:23.000Z","dependencies_parsed_at":"2024-06-17T19:45:33.366Z","dependency_job_id":"3cc43ae3-c45f-4523-95ef-76971ca9f472","html_url":"https://github.com/davidwrossiter/langchunk","commit_stats":null,"previous_names":["davidwrossiter/langchunk"],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/davidwrossiter%2Flangchunk","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/davidwrossiter%2Flangchunk/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/davidwrossiter%2Flangchunk/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/davidwrossiter%2Flangchunk/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/davidwrossiter","download_url":"https://codeload.github.com/davidwrossiter/langchunk/tar.gz/refs/heads/main","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":244676454,"owners_count":20491828,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["chunking","chunking-algorithm","embedding","llm-context","vectorization"],"created_at":"2024-11-26T00:41:51.401Z","updated_at":"2025-03-20T19:26:57.539Z","avatar_url":"https://github.com/davidwrossiter.png","language":"JavaScript","funding_links":[],"categories":[],"sub_categories":[],"readme":"# Lang chunk\n\n\u003e I created langchunk to chunk entire codebases correctly.\n\nRAG systems rely on data that has been properly chunked and embedded. Langchunk allows you to create high-quality chunks from any codebase including metadata about the file structure of the directory and the content of each file within it.\n\n---\n\n**Current capabilities**\n\n- Allows for chunking of javascript source code.\n- Chunks based on Function declaration, class declaration, variable declaration, and expression statements.\n\n**Steps for future versions**\n\n- Allow for different languages\n- Generate embeddings for vector databases\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdavidwrossiter%2Flangchunk","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fdavidwrossiter%2Flangchunk","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdavidwrossiter%2Flangchunk/lists"}