{"id":18700121,"url":"https://github.com/runekaagaard/py-webkit-html-manipulator","last_synced_at":"2025-11-08T21:30:22.875Z","repository":{"id":31382095,"uuid":"34945161","full_name":"runekaagaard/py-webkit-html-manipulator","owner":"runekaagaard","description":"Automatically exported from code.google.com/p/py-webkit-html-manipulator","archived":false,"fork":false,"pushed_at":"2015-05-02T11:29:36.000Z","size":148,"stargazers_count":1,"open_issues_count":2,"forks_count":0,"subscribers_count":2,"default_branch":"master","last_synced_at":"2024-12-28T05:17:37.928Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":null,"language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":null,"status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/runekaagaard.png","metadata":{"files":{"readme":"README","changelog":null,"contributing":null,"funding":null,"license":null,"code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null}},"created_at":"2015-05-02T11:24:34.000Z","updated_at":"2018-02-27T03:45:44.000Z","dependencies_parsed_at":"2022-08-17T18:55:18.724Z","dependency_job_id":null,"html_url":"https://github.com/runekaagaard/py-webkit-html-manipulator","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runekaagaard%2Fpy-webkit-html-manipulator","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runekaagaard%2Fpy-webkit-html-manipulator/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runekaagaard%2Fpy-webkit-html-manipulator/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/runekaagaard%2Fpy-webkit-html-manipulator/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/runekaagaard","download_url":"https://codeload.github.com/runekaagaard/py-webkit-html-manipulator/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":239561473,"owners_count":19659467,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":[],"created_at":"2024-11-07T11:35:51.217Z","updated_at":"2025-11-08T21:30:22.821Z","avatar_url":"https://github.com/runekaagaard.png","language":"Python","funding_links":[],"categories":[],"sub_categories":[],"readme":"== Welcome to Py Webkit Html Manipulator ==\nThis script allows you to render a webpage on your server and manipulate and \nextract the rendered html. The manipulation is done with\njavascript in the browser using the pyQt Webkit Api.\n\nThe difference from a normal html scraper is that javscript and css also is \nrendered.\n\n== Installation ==\nInstall python and pyQt. On ubuntu you would run:\n\n  sudo apt-get install python python-qt4\n\nIf you make it work on other platforms please let me know how.\n\n== Usage ==\n# Get help\n  ./whm.py --help\n\n# Run it\n  ./whm.py -u 'http://example.com'\n\n# Run it headless. Works only on linux. You need to install xvfb first.\n# On ubuntu run sudo apt-get install xvfb \n  xvfb-run --server-args=\"-screen 0, 640x480x24\" ./whm.py --url='http://example.com' --js-file=whm-example.js\n\n== The format of the js file ==\nIf no --js-file argument is supplied the html for webpage will be outputted.\nIf --js-file argument is present the output will be the content of\nthe variable WebkitHtmlManipulator.result that must be available in the global\nscope.\n\nSee whm-example.js for an example. It adds information about position,\nfont-size, etc. to each element in the dom.\n\n== Contact ==\nRune Kaagaard\nCopenhagen, Denmark\nrumi.kg@gmail.com\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Frunekaagaard%2Fpy-webkit-html-manipulator","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Frunekaagaard%2Fpy-webkit-html-manipulator","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Frunekaagaard%2Fpy-webkit-html-manipulator/lists"}