{"id":21343693,"url":"https://github.com/catalystcode/streaming-instagram","last_synced_at":"2025-08-15T00:36:16.552Z","repository":{"id":73517189,"uuid":"89634478","full_name":"CatalystCode/streaming-instagram","owner":"CatalystCode","description":"A library for reading social data from Instagram using Spark Streaming.","archived":false,"fork":false,"pushed_at":"2017-06-05T14:27:54.000Z","size":75,"stargazers_count":11,"open_issues_count":0,"forks_count":3,"subscribers_count":14,"default_branch":"master","last_synced_at":"2025-07-12T15:39:49.921Z","etag":null,"topics":["instagram","scala","spark-streaming"],"latest_commit_sha":null,"homepage":null,"language":"Scala","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"mit","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/CatalystCode.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2017-04-27T19:46:36.000Z","updated_at":"2023-03-15T13:17:46.000Z","dependencies_parsed_at":null,"dependency_job_id":"f7037de1-0009-4146-8f05-d4eb2b3fe691","html_url":"https://github.com/CatalystCode/streaming-instagram","commit_stats":null,"previous_names":[],"tags_count":7,"template":false,"template_full_name":null,"purl":"pkg:github/CatalystCode/streaming-instagram","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/CatalystCode%2Fstreaming-instagram","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/CatalystCode%2Fstreaming-instagram/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/CatalystCode%2Fstreaming-instagram/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/CatalystCode%2Fstreaming-instagram/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/CatalystCode","download_url":"https://codeload.github.com/CatalystCode/streaming-instagram/tar.gz/refs/heads/master","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/CatalystCode%2Fstreaming-instagram/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":270505916,"owners_count":24596505,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","status":"online","status_checked_at":"2025-08-14T02:00:10.309Z","response_time":75,"last_error":null,"robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":true,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["instagram","scala","spark-streaming"],"created_at":"2024-11-22T01:14:50.947Z","updated_at":"2025-08-15T00:36:16.543Z","avatar_url":"https://github.com/CatalystCode.png","language":"Scala","readme":"A library for reading social data from [Instagram](http://instagram.com) using Spark Streaming.\n\n[![Travis CI status](https://api.travis-ci.org/CatalystCode/streaming-instagram.svg?branch=master)](https://travis-ci.org/CatalystCode/streaming-instagram)\n\n## Usage example ##\n\nRun a demo via:\n\n```sh\n# set up all the requisite environment variables\nexport INSTAGRAM_AUTH_TOKEN=\"...\"\n\n# compile scala, run tests, build fat jar\nsbt assembly\n\n# run locally\njava -cp target/scala-2.11/streaming-instagram-assembly-0.0.7.jar InstagramDemo standalone\n\n# run on spark\nspark-submit --class InstagramDemo --master local[2] target/scala-2.11/streaming-instagram-assembly-0.0.7.jar spark\n```\n\n## How does it work? ##\n\nInstagram doesn't expose a firehose API so we resort to polling. The InstagramReceiver pings the Instagram API every few\nseconds and pushes any new images into Spark Streaming for further processing.\n\nCurrently, the following ways to read images are supported:\n- by location ([sample data](https://www.instagram.com/explore/locations/213819997/vancouver-british-columbia/))\n- by tag ([sample data](https://www.instagram.com/explore/tags/rose/))\n- by user ([sample data](https://www.instagram.com/viawesome/))\n\n## Release process ##\n\n1. Configure your credentials via the `SONATYPE_USER` and `SONATYPE_PASSWORD` environment variables.\n2. Update `version.sbt`\n3. Enter the SBT shell: `sbt`\n4. Run `sonatypeOpen \"enter staging description here\"`\n5. Run `publishSigned`\n6. Run `sonatypeRelease`\n\n","funding_links":[],"categories":[],"sub_categories":[],"project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fcatalystcode%2Fstreaming-instagram","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fcatalystcode%2Fstreaming-instagram","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fcatalystcode%2Fstreaming-instagram/lists"}