{"id":16567923,"url":"https://github.com/drorata/jupyter-spark-python-setup","last_synced_at":"2025-03-05T10:40:30.639Z","repository":{"id":150667622,"uuid":"50347698","full_name":"drorata/Jupyter-Spark-Python-setup","owner":"drorata","description":null,"archived":false,"fork":false,"pushed_at":"2016-01-25T12:00:03.000Z","size":21,"stargazers_count":2,"open_issues_count":0,"forks_count":0,"subscribers_count":2,"default_branch":"master","last_synced_at":"2025-01-15T23:59:20.804Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":"Jupyter Notebook","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/drorata.png","metadata":{"files":{"readme":"readme.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null}},"created_at":"2016-01-25T11:58:15.000Z","updated_at":"2016-10-13T21:54:13.000Z","dependencies_parsed_at":"2023-04-20T02:24:31.179Z","dependency_job_id":null,"html_url":"https://github.com/drorata/Jupyter-Spark-Python-setup","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/drorata%2FJupyter-Spark-Python-setup","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/drorata%2FJupyter-Spark-Python-setup/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/drorata%2FJupyter-Spark-Python-setup/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/drorata%2FJupyter-Spark-Python-setup/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/drorata","download_url":"https://codeload.github.com/drorata/Jupyter-Spark-Python-setup/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":242012392,"owners_count":20057649,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":[],"created_at":"2024-10-11T21:07:48.485Z","updated_at":"2025-03-05T10:40:30.607Z","avatar_url":"https://github.com/drorata.png","language":"Jupyter Notebook","funding_links":[],"categories":[],"sub_categories":[],"readme":"This repository holds my attempts to allow interaction with [Spark](https://spark.apache.org/) on a local machine as well as on a remote cluster using Python from within [Jupyter](http://jupyter.org/).\n\nMain steps:\n\n  * Setup Spark on a local machine (DONE)\n  * Execute simple Spark job(s) on a local machine from Jupyter (DONE)\n  * Load CSV files into spark, using `spark_csv`\n  * Link *local* notebook to a cluster instance of Spark and run jobs remotely. Here, it is important to understand how to setup the notebook where to execute Spark. Should be simple to toggle between the local and remote instances.\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdrorata%2Fjupyter-spark-python-setup","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fdrorata%2Fjupyter-spark-python-setup","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdrorata%2Fjupyter-spark-python-setup/lists"}