{"id":18191999,"url":"https://github.com/codekow/demo-containerized-dataset","last_synced_at":"2025-04-07T16:28:35.961Z","repository":{"id":201061237,"uuid":"706860677","full_name":"codekow/demo-containerized-dataset","owner":"codekow","description":"How to make your dataset available and immutable via containers","archived":false,"fork":false,"pushed_at":"2024-03-14T22:34:59.000Z","size":10,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-02-13T18:49:37.200Z","etag":null,"topics":["containers","data-science","datasets","docker"],"latest_commit_sha":null,"homepage":"","language":null,"has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/codekow.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2023-10-18T18:57:06.000Z","updated_at":"2023-10-18T19:21:55.000Z","dependencies_parsed_at":null,"dependency_job_id":"6b2d146d-8c9b-4417-a6b5-412c49a680ce","html_url":"https://github.com/codekow/demo-containerized-dataset","commit_stats":null,"previous_names":["codekow/demo-containerized-dataset"],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/codekow%2Fdemo-containerized-dataset","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/codekow%2Fdemo-containerized-dataset/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/codekow%2Fdemo-containerized-dataset/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/codekow%2Fdemo-containerized-dataset/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/codekow","download_url":"https://codeload.github.com/codekow/demo-containerized-dataset/tar.gz/refs/heads/main","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":247687232,"owners_count":20979423,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["containers","data-science","datasets","docker"],"created_at":"2024-11-03T06:41:59.108Z","updated_at":"2025-04-07T16:28:35.944Z","avatar_url":"https://github.com/codekow.png","language":null,"funding_links":[],"categories":[],"sub_categories":[],"readme":"# Containerized Datasets\n\nThe purpose of this repo show options around serving and\nmaintaining datasets used for training machine learning models\nwith common tools.\n\nWe can use the benefits of containers, immutability and versioning, to support [reproducibility and replicability](https://www.ncbi.nlm.nih.gov/books/NBK547546/) which are key\nto **science**.\n\nDisclaimer: This is one method among many and may not meet your needs or be the best option. This is **a way**, NOT **the way**.\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fcodekow%2Fdemo-containerized-dataset","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fcodekow%2Fdemo-containerized-dataset","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fcodekow%2Fdemo-containerized-dataset/lists"}