{"id":13627560,"url":"https://skylion007.github.io/OpenWebTextCorpus/","last_synced_at":"2025-04-17T00:31:54.085Z","repository":{"id":48760803,"uuid":"184109202","full_name":"Skylion007/OpenWebTextCorpus","owner":"Skylion007","description":null,"archived":false,"fork":false,"pushed_at":"2024-03-31T16:38:50.000Z","size":13,"stargazers_count":21,"open_issues_count":0,"forks_count":2,"subscribers_count":2,"default_branch":"master","last_synced_at":"2025-04-10T17:19:37.591Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":null,"has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/Skylion007.png","metadata":{"files":{"readme":null,"changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2019-04-29T16:51:05.000Z","updated_at":"2024-06-30T08:46:02.000Z","dependencies_parsed_at":"2024-01-17T07:36:06.040Z","dependency_job_id":"5ee6be3f-688f-4d15-84a5-ae0d4fc38970","html_url":"https://github.com/Skylion007/OpenWebTextCorpus","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Skylion007%2FOpenWebTextCorpus","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Skylion007%2FOpenWebTextCorpus/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Skylion007%2FOpenWebTextCorpus/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Skylion007%2FOpenWebTextCorpus/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/Skylion007","download_url":"https://codeload.github.com/Skylion007/OpenWebTextCorpus/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":249289491,"owners_count":21244966,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":[],"created_at":"2024-08-01T22:00:35.698Z","updated_at":"2025-04-17T00:31:54.072Z","avatar_url":"https://github.com/Skylion007.png","language":null,"funding_links":[],"categories":["Pre-training Corpora","NLP语料和数据集","Datasets \u0026 Content Sources","Datasets \u0026 Data Prep"],"sub_categories":["General Pre-training Corpora","大语言对话模型及数据"],"readme":null,"project_url":"https://awesome.ecosyste.ms/api/v1/projects/skylion007.github.io%2FOpenWebTextCorpus%2F","html_url":"https://awesome.ecosyste.ms/projects/skylion007.github.io%2FOpenWebTextCorpus%2F","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/skylion007.github.io%2FOpenWebTextCorpus%2F/lists"}