{"id":24143845,"url":"https://github.com/dnbaker/dnlp","last_synced_at":"2026-06-09T12:31:30.468Z","repository":{"id":94818443,"uuid":"136655870","full_name":"dnbaker/dnlp","owner":"dnbaker","description":"A hodgepodge of NLP-related code.","archived":false,"fork":false,"pushed_at":"2018-06-16T13:32:32.000Z","size":37,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":2,"default_branch":"master","last_synced_at":"2025-03-01T14:33:06.056Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":"","language":"C++","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"gpl-3.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/dnbaker.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2018-06-08T18:58:57.000Z","updated_at":"2018-11-02T04:59:52.000Z","dependencies_parsed_at":"2023-04-24T06:02:24.773Z","dependency_job_id":null,"html_url":"https://github.com/dnbaker/dnlp","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/dnbaker/dnlp","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/dnbaker%2Fdnlp","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/dnbaker%2Fdnlp/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/dnbaker%2Fdnlp/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/dnbaker%2Fdnlp/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/dnbaker","download_url":"https://codeload.github.com/dnbaker/dnlp/tar.gz/refs/heads/master","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/dnbaker%2Fdnlp/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":286080680,"owners_count":34107865,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2026-05-26T15:22:16.424Z","status":"online","status_checked_at":"2026-06-09T02:00:06.510Z","response_time":63,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":[],"created_at":"2025-01-12T05:45:42.733Z","updated_at":"2026-06-09T12:31:30.463Z","avatar_url":"https://github.com/dnbaker.png","language":"C++","funding_links":[],"categories":[],"sub_categories":[],"readme":"# dnlp\nDaniel's NLP library\n\nThis is a relatively new project. Currently, all that's supported are utilities for iterating over ngrams in text corpuses, and, as of yet, only ASCII is supported.\nThe goal is to reuse this code in a variety of projects.\n\n## parse.h\nParses a text file or a string, iterating efficiently over ngrams by using a circular buffer and short-string-optimized strings.\n\n## testparse.cpp\nSimply puts all ngrams from a file into a hyperloglog and reports its cardinality. This has obvious applications in indexing and approximate counting for natural language processing applications.\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdnbaker%2Fdnlp","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fdnbaker%2Fdnlp","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdnbaker%2Fdnlp/lists"}