{"id":15732367,"url":"https://github.com/stopsopa/html-scraper-browserless","last_synced_at":"2025-03-31T03:26:02.828Z","repository":{"id":84269148,"uuid":"140576543","full_name":"stopsopa/html-scraper-browserless","owner":"stopsopa","description":null,"archived":false,"fork":false,"pushed_at":"2023-09-01T23:29:55.000Z","size":571,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":3,"default_branch":"master","last_synced_at":"2025-02-06T08:13:16.734Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":"JavaScript","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/stopsopa.png","metadata":{"files":{"readme":"Readme.md","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2018-07-11T13:07:26.000Z","updated_at":"2022-01-17T15:53:21.000Z","dependencies_parsed_at":"2024-10-24T23:21:29.274Z","dependency_job_id":"ebd18552-e172-4920-9e4e-5e2a3f6502e3","html_url":"https://github.com/stopsopa/html-scraper-browserless","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/stopsopa%2Fhtml-scraper-browserless","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/stopsopa%2Fhtml-scraper-browserless/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/stopsopa%2Fhtml-scraper-browserless/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/stopsopa%2Fhtml-scraper-browserless/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/stopsopa","download_url":"https://codeload.github.com/stopsopa/html-scraper-browserless/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":246409891,"owners_count":20772569,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":[],"created_at":"2024-10-04T00:09:06.554Z","updated_at":"2025-03-31T03:26:02.803Z","avatar_url":"https://github.com/stopsopa.png","language":"JavaScript","funding_links":[],"categories":[],"sub_categories":[],"readme":"# Deprecated\n(Deprecated -\u003e use better https://github.com/stopsopa/html-scraper-browserless) Microservice tool to scraping html from \"any\" page\n\nI wouldn't suggest it now - it's just old. But I'll leave it here.\n\n\n\n\n# Installation:\n\n    git clone this repository and go to main directory\n    make install\n    cp config.js.dist config.js\n    \n    # manually change password in config.js for basic auth\n    \n    make start\n    \n\n# Using:\n    \nJust visit:\n\n        http://localhost:8811/generate\n\n    \n# Current execution environment:\n\n    - node v8.9.4\n    - yarn\n    - Docker version 18.03.1-ce, build 9ee9f40  \n    \n# Ping:\n    \n    http://xx.xx.xx.xx:8811/html-scraper-ping\n    http://slowwly.robertomurray.co.uk/delay/32000/url/https://github.com/stopsopa/docker-puppeteer-pdf-generator\n    \n# Useful things (irrelevant now):  \n        \n    docker run -it --rm puppeteer-alpine-generate-pdf /usr/bin/chromium-browser --version        \n        $ Chromium 64.0.3282.168\n        \n    or if you follow node:8-slim : https://github.com/GoogleChrome/puppeteer/blob/master/docs/troubleshooting.md#running-puppeteer-in-docker\n        docker run -it --rm --cap-add=SYS_ADMIN --rm puppeteer-chrome-linux /usr/bin/google-chrome-unstable --version\n            Google Chrome 68.0.3438.3 dev\n        \n    on mac:\n        /Applications/Google\\ Chrome.app/Contents/MacOS/Google\\ Chrome --version\n            $ Google Chrome 66.0.3359.181\n        /Applications/Google\\ Chrome\\ Canary.app/Contents/MacOS/Google\\ Chrome\\ Canary --version\n            $ Google Chrome 69.0.3445.0 canary\n   \n\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fstopsopa%2Fhtml-scraper-browserless","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fstopsopa%2Fhtml-scraper-browserless","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fstopsopa%2Fhtml-scraper-browserless/lists"}