{"id":13401502,"url":"https://github.com/kermitt2/grobid","last_synced_at":"2025-05-12T13:09:05.741Z","repository":{"id":4651508,"uuid":"5797013","full_name":"kermitt2/grobid","owner":"kermitt2","description":"A machine learning software for extracting information from scholarly documents","archived":false,"fork":false,"pushed_at":"2025-05-12T07:00:59.000Z","size":1637321,"stargazers_count":4014,"open_issues_count":408,"forks_count":481,"subscribers_count":95,"default_branch":"master","last_synced_at":"2025-05-12T13:08:20.811Z","etag":null,"topics":["bibliographical-references","crf","deep-learning","fulltext","hamburger-to-cow","machine-learning","metadata","pdf","rnn","scientific-articles","transformers"],"latest_commit_sha":null,"homepage":"https://grobid.readthedocs.io","language":"Java","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/kermitt2.png","metadata":{"files":{"readme":"Readme.md","changelog":"CHANGELOG.md","contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2012-09-13T15:48:54.000Z","updated_at":"2025-05-12T08:35:48.000Z","dependencies_parsed_at":"2025-04-23T17:19:36.978Z","dependency_job_id":null,"html_url":"https://github.com/kermitt2/grobid","commit_stats":{"total_commits":2726,"total_committers":63,"mean_commits":43.26984126984127,"dds":0.5818048422597212,"last_synced_commit":"0f57c0d04b70e5de7e227729a15642444bead070"},"previous_names":[],"tags_count":31,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/kermitt2%2Fgrobid","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/kermitt2%2Fgrobid/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/kermitt2%2Fgrobid/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/kermitt2%2Fgrobid/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/kermitt2","download_url":"https://codeload.github.com/kermitt2/grobid/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":253745160,"owners_count":21957317,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["bibliographical-references","crf","deep-learning","fulltext","hamburger-to-cow","machine-learning","metadata","pdf","rnn","scientific-articles","transformers"],"created_at":"2024-07-30T19:01:03.514Z","updated_at":"2025-05-12T13:09:00.709Z","avatar_url":"https://github.com/kermitt2.png","language":"Java","funding_links":[],"categories":["Java","Optical Character Recognition Engines and Frameworks","Information extraction","Tools","📋 Scientific Documentation \u0026 Parsing","人工智能","PDF and Document Processing Tools"],"sub_categories":["CTPN [paper:2016](https://arxiv.org/pdf/1609.03605.pdf)","High-Performance Document Processing","Vector Store Tutorials"],"readme":null,"project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fkermitt2%2Fgrobid","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fkermitt2%2Fgrobid","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fkermitt2%2Fgrobid/lists"}