{"id":16039755,"url":"https://github.com/hpprc/saku","last_synced_at":"2025-06-20T12:34:37.922Z","repository":{"id":44553638,"uuid":"436315041","full_name":"hppRC/saku","owner":"hppRC","description":"A Japanese Sentence Tokenizer written in Rust.","archived":false,"fork":false,"pushed_at":"2022-08-10T08:25:27.000Z","size":48,"stargazers_count":2,"open_issues_count":0,"forks_count":0,"subscribers_count":2,"default_branch":"main","last_synced_at":"2025-05-15T01:40:59.140Z","etag":null,"topics":["japanese","nlp","python-bindings","rust"],"latest_commit_sha":null,"homepage":"https://crates.io/crates/saku","language":"Rust","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"mit","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/hppRC.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null}},"created_at":"2021-12-08T16:24:52.000Z","updated_at":"2022-06-28T13:44:58.000Z","dependencies_parsed_at":"2022-07-20T20:18:49.841Z","dependency_job_id":null,"html_url":"https://github.com/hppRC/saku","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/hppRC/saku","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/hppRC%2Fsaku","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/hppRC%2Fsaku/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/hppRC%2Fsaku/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/hppRC%2Fsaku/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/hppRC","download_url":"https://codeload.github.com/hppRC/saku/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/hppRC%2Fsaku/sbom","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":260945381,"owners_count":23086999,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["japanese","nlp","python-bindings","rust"],"created_at":"2024-10-08T23:07:32.395Z","updated_at":"2025-06-20T12:34:32.900Z","avatar_url":"https://github.com/hppRC.png","language":"Rust","funding_links":[],"categories":[],"sub_categories":[],"readme":"# Saku: Japanese Sentence Tokenizer\n\n**Saku** is a library for splitting Japanese text into sentences based on hand-made rules written in Rust. \\\n**\"割く(saku)\"** means \"spliting something\" in Japanese.\n\n\nThis library is named after a Japanese VTuber [Saku Sasaki / 笹木咲](https://www.youtube.com/channel/UCoztvTULBYd3WmStqYeoHcA).\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fhpprc%2Fsaku","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fhpprc%2Fsaku","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fhpprc%2Fsaku/lists"}