{"id":20750328,"url":"https://github.com/bhavanachitragar/data-analysis-using-pyspark","last_synced_at":"2025-06-30T11:34:49.780Z","repository":{"id":231302441,"uuid":"781415232","full_name":"bhavanachitragar/Data-Analysis-using-Pyspark","owner":"bhavanachitragar","description":"Working with pyspark module in python and  using google colab environment in order to apply some queries to the dataset. The dataset consist of two csv files listening.csv and genre.csv. Also,  visualizing query results using matplotlib. ","archived":false,"fork":false,"pushed_at":"2024-04-03T10:54:50.000Z","size":18,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-03-11T14:21:25.909Z","etag":null,"topics":["data-analysis","google-colab","pyspark-sql"],"latest_commit_sha":null,"homepage":"","language":"Jupyter Notebook","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/bhavanachitragar.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2024-04-03T10:39:46.000Z","updated_at":"2024-04-03T11:04:04.000Z","dependencies_parsed_at":null,"dependency_job_id":"45114602-4d03-461b-a1c5-8b56e44e998b","html_url":"https://github.com/bhavanachitragar/Data-Analysis-using-Pyspark","commit_stats":null,"previous_names":["bhavanachitragar/data-analysis-using-pyspark"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/bhavanachitragar/Data-Analysis-using-Pyspark","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bhavanachitragar%2FData-Analysis-using-Pyspark","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bhavanachitragar%2FData-Analysis-using-Pyspark/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bhavanachitragar%2FData-Analysis-using-Pyspark/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bhavanachitragar%2FData-Analysis-using-Pyspark/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/bhavanachitragar","download_url":"https://codeload.github.com/bhavanachitragar/Data-Analysis-using-Pyspark/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/bhavanachitragar%2FData-Analysis-using-Pyspark/sbom","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":262766169,"owners_count":23361052,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["data-analysis","google-colab","pyspark-sql"],"created_at":"2024-11-17T08:26:49.313Z","updated_at":"2025-06-30T11:34:49.713Z","avatar_url":"https://github.com/bhavanachitragar.png","language":"Jupyter Notebook","funding_links":[],"categories":[],"sub_categories":[],"readme":"# Data Analysis using Pyspark\r\n-------------------------------------------------------------\r\n\r\n- Importing first csv file of our dataset   \r\n- Using pyspark sql data frame      \r\n- Queries to extract useful information\r\n- Importing second csv file of our dataset\r\n- Merging two data frames  and prepare it for more advanced queries\r\n- Visualizing results using matplotlib\r\n \r\n----------------------------------------------------------------\r\n\r\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fbhavanachitragar%2Fdata-analysis-using-pyspark","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fbhavanachitragar%2Fdata-analysis-using-pyspark","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fbhavanachitragar%2Fdata-analysis-using-pyspark/lists"}