{"id":14982329,"url":"https://github.com/databricks/learningsparkv2","last_synced_at":"2025-05-14T12:09:29.923Z","repository":{"id":37245645,"uuid":"169945599","full_name":"databricks/LearningSparkV2","owner":"databricks","description":"This is the github repo for Learning Spark: Lightning-Fast Data Analytics [2nd Edition]","archived":false,"fork":false,"pushed_at":"2025-01-28T04:30:40.000Z","size":78816,"stargazers_count":1276,"open_issues_count":1,"forks_count":763,"subscribers_count":40,"default_branch":"master","last_synced_at":"2025-04-13T06:15:17.766Z","etag":null,"topics":["apache-spark","delta-lake","mlflow","mllib","spark","spark-mllib","spark-sql","structured-streaming"],"latest_commit_sha":null,"homepage":"https://learning.oreilly.com/library/view/learning-spark-2nd/9781492050032/","language":"Scala","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/databricks.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2019-02-10T05:17:50.000Z","updated_at":"2025-04-11T20:20:15.000Z","dependencies_parsed_at":"2025-02-15T10:11:29.854Z","dependency_job_id":null,"html_url":"https://github.com/databricks/LearningSparkV2","commit_stats":{"total_commits":121,"total_committers":3,"mean_commits":"40.333333333333336","dds":"0.44628099173553715","last_synced_commit":"3db28ef50a0a0ff3ad4a632702289f148d6f246c"},"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/databricks%2FLearningSparkV2","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/databricks%2FLearningSparkV2/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/databricks%2FLearningSparkV2/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/databricks%2FLearningSparkV2/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/databricks","download_url":"https://codeload.github.com/databricks/LearningSparkV2/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":248670434,"owners_count":21142904,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["apache-spark","delta-lake","mlflow","mllib","spark","spark-mllib","spark-sql","structured-streaming"],"created_at":"2024-09-24T14:05:12.752Z","updated_at":"2025-04-13T06:15:36.081Z","avatar_url":"https://github.com/databricks.png","language":"Scala","readme":"# Learning Spark 2nd Edition\n\nWelcome to the GitHub repo for Learning Spark 2nd Edition.\n\nChapters [2](chapter2/README.md), [3](chapter3/README.md), [6](chapter6/README.md), and [7](chapter7/README.md) contain stand-alone Spark applications. You can build all the JAR files for each chapter by running the Python script: `python build_jars.py`.\nOr you can cd to the chapter directory and build jars as specified in each README. Also, include `$SPARK_HOME/bin` in `$PATH`  so that you\ndon't have to prefix `SPARK_HOME/bin/spark-submit` for these standalone applications.\n\nFor all the other chapters, we have provided notebooks in the [notebooks](notebooks) folder. We have also included notebook equivalents for a few of the stand-alone Spark applications in the aforementioned chapters.\n\nHave Fun, Cheers!\n","funding_links":[],"categories":[],"sub_categories":[],"project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdatabricks%2Flearningsparkv2","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fdatabricks%2Flearningsparkv2","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdatabricks%2Flearningsparkv2/lists"}