{"id":16707430,"url":"https://github.com/xiaodaigh/data_manipulation_benchmarks","last_synced_at":"2025-04-10T05:15:48.646Z","repository":{"id":73048511,"uuid":"104734694","full_name":"xiaodaigh/data_manipulation_benchmarks","owner":"xiaodaigh","description":"A set of data manipulation benchmarking code for Julia and R","archived":false,"fork":false,"pushed_at":"2020-02-08T14:59:56.000Z","size":23,"stargazers_count":5,"open_issues_count":3,"forks_count":4,"subscribers_count":4,"default_branch":"master","last_synced_at":"2025-04-10T05:15:42.136Z","etag":null,"topics":["comparison","data-manipulation-prowess","julia","r"],"latest_commit_sha":null,"homepage":"","language":"Julia","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/xiaodaigh.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null}},"created_at":"2017-09-25T10:13:05.000Z","updated_at":"2019-11-18T02:23:39.000Z","dependencies_parsed_at":null,"dependency_job_id":"93a2b18c-ed7a-41d1-b0dd-53af0a8502f0","html_url":"https://github.com/xiaodaigh/data_manipulation_benchmarks","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/xiaodaigh%2Fdata_manipulation_benchmarks","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/xiaodaigh%2Fdata_manipulation_benchmarks/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/xiaodaigh%2Fdata_manipulation_benchmarks/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/xiaodaigh%2Fdata_manipulation_benchmarks/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/xiaodaigh","download_url":"https://codeload.github.com/xiaodaigh/data_manipulation_benchmarks/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":248161280,"owners_count":21057556,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["comparison","data-manipulation-prowess","julia","r"],"created_at":"2024-10-12T19:39:30.604Z","updated_at":"2025-04-10T05:15:48.566Z","avatar_url":"https://github.com/xiaodaigh.png","language":"Julia","funding_links":[],"categories":[],"sub_categories":[],"readme":"# Julia vs R data manipulation benchmark suite\nA comparison of data manipulation prowess using synthetic data and the [GE Flight Quest data](https://www.kaggle.com/c/flight/data)\n\n# Set up instructions\n1. Change the settings.csv's data_path to a path that you can write to\n2. Download the 7z file (https://www.kaggle.com/c/flight/download/InitialTrainingSet_rev1.7z) and \n3. Extract it into the folder data_path/InitialTrainingSet_rev1\n\n# Synthetic benchmarks\nAdapted from data.tables' [official benchmarks](https://github.com/Rdatatable/data.table/wiki/Benchmarks-:-Grouping#code-to-reproduce-the-timings-above-)\n\n# \"Real-life\" benchmarks\nUses [GE Flight Quest data](https://www.kaggle.com/c/flight/data), the largest tabular dataset on Kaggle at the time of writing\n\n# Companion post\n[Speed of data manipulations in Julia vs R](https://www.codementor.io/zhuojiadai/speed-of-data-manipulation-in-julia-vs-r-cd7praapv)\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fxiaodaigh%2Fdata_manipulation_benchmarks","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fxiaodaigh%2Fdata_manipulation_benchmarks","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fxiaodaigh%2Fdata_manipulation_benchmarks/lists"}