{"id":19020503,"url":"https://github.com/niravjoshi33/news_crunch","last_synced_at":"2026-04-28T09:30:20.843Z","repository":{"id":199540523,"uuid":"702773340","full_name":"NiravJoshi33/news_crunch","owner":"NiravJoshi33","description":"App to scrape articles data and display in single page","archived":false,"fork":false,"pushed_at":"2024-02-09T10:23:55.000Z","size":629,"stargazers_count":0,"open_issues_count":2,"forks_count":0,"subscribers_count":2,"default_branch":"main","last_synced_at":"2025-01-02T00:27:22.603Z","etag":null,"topics":["data-mining","data-science","gui","webscraping"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/NiravJoshi33.png","metadata":{"files":{"readme":"README.md","changelog":"News_Crunch_GUI.py","contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2023-10-10T01:45:49.000Z","updated_at":"2023-10-14T23:30:57.000Z","dependencies_parsed_at":"2023-10-15T20:35:13.128Z","dependency_job_id":"52a3f2df-4bf4-49cc-9d3d-503db5a9a8fd","html_url":"https://github.com/NiravJoshi33/news_crunch","commit_stats":null,"previous_names":["niravjoshi33/news_crunch"],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/NiravJoshi33%2Fnews_crunch","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/NiravJoshi33%2Fnews_crunch/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/NiravJoshi33%2Fnews_crunch/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/NiravJoshi33%2Fnews_crunch/mani
fests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/NiravJoshi33","download_url":"https://codeload.github.com/NiravJoshi33/news_crunch/tar.gz/refs/heads/main","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":240064823,"owners_count":19742389,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["data-mining","data-science","gui","webscraping"],"created_at":"2024-11-08T20:17:19.922Z","updated_at":"2026-04-28T09:30:20.786Z","avatar_url":"https://github.com/NiravJoshi33.png","language":"Python","funding_links":[],"categories":[],"sub_categories":[],"readme":"\n\u003ca id=\"readme-top\"\u003e\u003c/a\u003e\n\u003c!-- PROJECT LOGO --\u003e\n\u003cbr /\u003e\n\u003cdiv align=\"center\"\u003e\n  \u003ca href=\"https://github.com/NiravJoshi33/news_crunch\"\u003e\n    \u003cimg src=\"https://github.com/NiravJoshi33/news_crunch/blob/main/nc_long_logo.png\" alt=\"Logo\" width=\"500\" height=\"80\"\u003e\n  \u003c/a\u003e\n\n\u003ch3 align=\"center\"\u003eNews Crunch\u003c/h3\u003e\n\n  \u003cp align=\"center\"\u003e\n    An app to scrape data from news websites and display the articles in a web GUI. 
\n    \u003cbr /\u003e\n    \u003ca href=\"https://github.com/NiravJoshi33/news_crunch\"\u003e\u003cstrong\u003eExplore the docs »\u003c/strong\u003e\u003c/a\u003e\n    \u003cbr /\u003e\n    \u003cbr /\u003e\n    \u003ca href=\"https://youtu.be/TkfpN3fg_HM\"\u003eView Demo\u003c/a\u003e\n    ·\n    \u003ca href=\"https://github.com/NiravJoshi33/news_crunch/issues\"\u003eReport Bug\u003c/a\u003e\n    ·\n    \u003ca href=\"https://github.com/NiravJoshi33/news_crunch/issues\"\u003eRequest Feature\u003c/a\u003e\n  \u003c/p\u003e\n\u003c/div\u003e\n\n\n\n\u003c!-- TABLE OF CONTENTS --\u003e\n\u003cdetails\u003e\n  \u003csummary\u003eTable of Contents\u003c/summary\u003e\n  \u003col\u003e\n    \u003cli\u003e\n      \u003ca href=\"#about-the-project\"\u003eAbout The Project\u003c/a\u003e\n      \u003cul\u003e\n        \u003cli\u003e\u003ca href=\"#built-with\"\u003eBuilt With\u003c/a\u003e\u003c/li\u003e\n      \u003c/ul\u003e\n    \u003c/li\u003e\n    \u003cli\u003e\n      \u003ca href=\"#getting-started\"\u003eGetting Started\u003c/a\u003e\n      \u003cul\u003e\n        \u003cli\u003e\u003ca href=\"#prerequisites--installation\"\u003ePrerequisites \u0026 Installation\u003c/a\u003e\u003c/li\u003e\n      \u003c/ul\u003e\n    \u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#how-to-use\"\u003eUsage\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#to-do\"\u003eTo Do\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#contributing\"\u003eContributing\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#contact\"\u003eContact\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#acknowledgments\"\u003eAcknowledgments\u003c/a\u003e\u003c/li\u003e\n  \u003c/ol\u003e\n\u003c/details\u003e\n\n\n\n\u003c!-- ABOUT THE PROJECT --\u003e\n## About The Project\n\n![Product Name Screen Shot](https://github.com/NiravJoshi33/news_crunch/blob/main/app_screenshot.png)\n\nThis is an app that scrapes news article details such as title, date, 
author, etc. from different news websites, processes the data, and shows it on a single page. \n\nThis app is inspired by [inshorts](https://m.inshorts.com/en/read)\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n### Built With\n\n[![forthebadge made-with-python](http://ForTheBadge.com/images/badges/made-with-python.svg)](https://www.python.org/)\n\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- GETTING STARTED --\u003e\n## Getting Started\n\n\n\n### Prerequisites \u0026 Installation\n\nBefore starting, please make sure that the following dependencies are installed on your machine\n* [Python](https://www.python.org/downloads/)\n* [pip](https://pypi.org/project/pip/)\n\nAfter the above dependencies are installed, follow the instructions below:\n* Clone the repo\n   ```sh\n   git clone https://github.com/NiravJoshi33/news_crunch.git\n   ```\n* Navigate to the project folder using the CLI\n* Install the other dependencies with the following command\n  ````\n  pip install -r requirements.txt\n  ````\n  Wait for the packages to be installed.\n\n\n\u003c!-- USAGE EXAMPLES --\u003e\n## How to Use\n\nFollow the instructions below to run the project\n\n* Run the following script\n  ```\n  main.py\n  ```\n* After the script has run, a browser should open and display a GUI. In case it doesn't open, open a browser manually and go to the following URL\n  ```\n  http://localhost:8501\n  ```\n* By default, a side bar will load with the page. 
From there, you can deselect any website you don't want to see news from and use the slider to select the number of articles to show.\n\n\u003c!-- ROADMAP --\u003e\n## To Do\n\n- [ ] Resolve Major Bugs with the current Basic Version\n  - [X] Run the app with a single script\n  - [X] OpenSSL Error occurring sometimes\n  - [X] Clean Data before showing in the GUI\n    - [X] Dates from all websites in the same format\n  - [ ] Inconsistent card size due to different sizes of thumbnails and excerpts\n- [ ] Test app on macOS\n- [ ] Data storage and access from an online database \n\n\nSee the [open issues](https://github.com/NiravJoshi33/news_crunch/issues) for a full list of proposed features (and known issues).\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- CONTRIBUTING --\u003e\n## Contributing\n\nContributions are what make the open source community such an amazing place to learn, inspire, and create. Any contributions you make are **greatly appreciated**.\n\nIf you have a suggestion that would make this better, please fork the repo and create a pull request. You can also simply open an issue with the tag \"enhancement\".\nDon't forget to give the project a star! Thanks again!\n\n1. Fork the Project\n2. Create your Feature Branch (`git checkout -b feature/AmazingFeature`)\n3. Commit your Changes (`git commit -m 'Add some AmazingFeature'`)\n4. Push to the Branch (`git push origin feature/AmazingFeature`)\n5. 
Open a Pull Request\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\u003c!-- CONTACT --\u003e\n## Contact\n\nNirav Joshi \\\nEmail - niravjoshi3000@gmail.com \\\nProject Link: [https://github.com/NiravJoshi33/news_crunch](https://github.com/NiravJoshi33/news_crunch)\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- ACKNOWLEDGMENTS --\u003e\n## Acknowledgments\n\n* [Scrapy Course - Python Web Scraping for Beginners](https://www.youtube.com/watch?v=mBoX_JCKZTE\u0026pp=ygUNc2NyYXB5IGNvdXJzZQ%3D%3D) by freecodecamp.org\n* [Python Streamlit Full Course](https://www.youtube.com/watch?v=RjiqbTLW9_E\u0026list=PLa6CNrvKM5QU7AjAS90zCMIwi9RTFNIIW)\n* [Best-README-Template](https://github.com/othneildrew/Best-README-Template) by [Othneil Drew](https://github.com/othneildrew)\n* Awesome community on [stackoverflow](https://stackoverflow.com/)\n* [ChatGPT](https://chat.openai.com/) by [OpenAI](https://openai.com/) for some Debugging\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- MARKDOWN LINKS \u0026 IMAGES --\u003e\n\u003c!-- https://www.markdownguide.org/basic-syntax/#reference-style-links --\u003e\n[contributors-shield]: https://img.shields.io/github/contributors/NiravJoshi33/news_crunch.svg?style=for-the-badge\n[contributors-url]: https://github.com/NiravJoshi33/news_crunch/graphs/contributors\n[forks-shield]: https://img.shields.io/github/forks/NiravJoshi33/news_crunch.svg?style=for-the-badge\n[forks-url]: https://github.com/NiravJoshi33/news_crunch/network/members\n[stars-shield]: https://img.shields.io/github/stars/NiravJoshi33/news_crunch.svg?style=for-the-badge\n[stars-url]: https://github.com/NiravJoshi33/news_crunch/stargazers\n[issues-shield]: https://img.shields.io/github/issues/NiravJoshi33/news_crunch.svg?style=for-the-badge\n[issues-url]: 
https://github.com/NiravJoshi33/news_crunch/issues\n[license-shield]: https://img.shields.io/github/license/NiravJoshi33/news_crunch.svg?style=for-the-badge\n[license-url]: https://github.com/NiravJoshi33/news_crunch/blob/master/LICENSE.txt\n[linkedin-shield]: https://img.shields.io/badge/-LinkedIn-black.svg?style=for-the-badge\u0026logo=linkedin\u0026colorB=555\n[linkedin-url]: https://linkedin.com/in/linkedin_username\n[product-screenshot]: images/screenshot.png\n[Next.js]: https://img.shields.io/badge/next.js-000000?style=for-the-badge\u0026logo=nextdotjs\u0026logoColor=white\n[Next-url]: https://nextjs.org/\n[React.js]: https://img.shields.io/badge/React-20232A?style=for-the-badge\u0026logo=react\u0026logoColor=61DAFB\n[React-url]: https://reactjs.org/\n[Vue.js]: https://img.shields.io/badge/Vue.js-35495E?style=for-the-badge\u0026logo=vuedotjs\u0026logoColor=4FC08D\n[Vue-url]: https://vuejs.org/\n[Angular.io]: https://img.shields.io/badge/Angular-DD0031?style=for-the-badge\u0026logo=angular\u0026logoColor=white\n[Angular-url]: https://angular.io/\n[Svelte.dev]: https://img.shields.io/badge/Svelte-4A4A55?style=for-the-badge\u0026logo=svelte\u0026logoColor=FF3E00\n[Svelte-url]: https://svelte.dev/\n[Laravel.com]: https://img.shields.io/badge/Laravel-FF2D20?style=for-the-badge\u0026logo=laravel\u0026logoColor=white\n[Laravel-url]: https://laravel.com\n[Bootstrap.com]: https://img.shields.io/badge/Bootstrap-563D7C?style=for-the-badge\u0026logo=bootstrap\u0026logoColor=white\n[Bootstrap-url]: https://getbootstrap.com\n[JQuery.com]: https://img.shields.io/badge/jQuery-0769AD?style=for-the-badge\u0026logo=jquery\u0026logoColor=white\n[JQuery-url]: https://jquery.com \n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fniravjoshi33%2Fnews_crunch","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fniravjoshi33%2Fnews_crunch","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fniravjoshi33%2Fnews_crunch/lists"}