{"id":22822934,"url":"https://github.com/renardeinside/pyspark-logging-examples","last_synced_at":"2025-07-19T04:34:31.251Z","repository":{"id":108304639,"uuid":"502378621","full_name":"renardeinside/pyspark-logging-examples","owner":"renardeinside","description":"Writing PySpark logs in Apache Spark and Databricks","archived":false,"fork":false,"pushed_at":"2022-06-13T12:56:49.000Z","size":21,"stargazers_count":16,"open_issues_count":0,"forks_count":7,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-05-31T22:03:51.983Z","etag":null,"topics":["apache-spark","databricks","log4j","logging","logs"],"latest_commit_sha":null,"homepage":"https://polarpersonal.medium.com/writing-pyspark-logs-in-apache-spark-and-databricks-8590c28d1d51","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/renardeinside.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2022-06-11T15:01:09.000Z","updated_at":"2024-10-29T03:18:46.000Z","dependencies_parsed_at":"2023-05-22T06:00:41.081Z","dependency_job_id":null,"html_url":"https://github.com/renardeinside/pyspark-logging-examples","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/renardeinside/pyspark-logging-examples","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/renardeinside%2Fpyspark-logging-examples","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/renardeinside%2Fpyspark-logging-examples/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/renardeinside%2Fpyspark-logging-examples/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/renardeinside%2Fpyspark-logging-examples/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/renardeinside","download_url":"https://codeload.github.com/renardeinside/pyspark-logging-examples/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/renardeinside%2Fpyspark-logging-examples/sbom","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":265889025,"owners_count":23844538,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["apache-spark","databricks","log4j","logging","logs"],"created_at":"2024-12-12T16:13:45.617Z","updated_at":"2025-07-19T04:34:31.244Z","avatar_url":"https://github.com/renardeinside.png","language":"Python","funding_links":[],"categories":[],"sub_categories":[],"readme":"# PySpark logging examples in local environment and on Databricks clusters\n\nThis repo contains examples on how to configure PySpark logs in the local Apache Spark environment and when using Databricks clusters.\n\n[Link to the blogpost with details](https://polarpersonal.medium.com/writing-pyspark-logs-in-apache-spark-and-databricks-8590c28d1d51).\n\n## Local setup\n\nProvide your logging configurations in `conf/local/log4j.properties` and pass this path via `SPARK_CONF_DIR` when initializing the Python session.\n\n## Databricks setup\n\n* Describe your logging configurations in `conf/databricks/driver-log4j.properties`. \n* Provide your `DATABRICKS_CLI_PROFILE` environment variable in the `.env` file\n* Upload the configurations to DBFS via `make upload-log-configuration`\n* Add the init script in the cluster properties\n\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Frenardeinside%2Fpyspark-logging-examples","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Frenardeinside%2Fpyspark-logging-examples","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Frenardeinside%2Fpyspark-logging-examples/lists"}