{"id":21151496,"url":"https://github.com/merrvve/pdf-image-extract","last_synced_at":"2025-07-20T21:34:45.906Z","repository":{"id":254756290,"uuid":"846528300","full_name":"merrvve/pdf-image-extract","owner":"merrvve","description":"Command-line tool to extract and save images (JPEG, PNG) from a PDF file or all PDFs in a directory based on the specific byte signatures.","archived":false,"fork":false,"pushed_at":"2024-08-25T20:12:44.000Z","size":4346,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-03-14T14:27:55.837Z","etag":null,"topics":["command-line-tool","pdf-extractor","pdf-image-extractor","python"],"latest_commit_sha":null,"homepage":"","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"mit","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/merrvve.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2024-08-23T12:01:20.000Z","updated_at":"2024-08-25T20:21:03.000Z","dependencies_parsed_at":"2024-08-25T22:56:57.895Z","dependency_job_id":"7bc30d72-e66c-4aa3-8fa7-6d9bec24dcce","html_url":"https://github.com/merrvve/pdf-image-extract","commit_stats":null,"previous_names":["merrvve/pdf-image-extract"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/merrvve/pdf-image-extract","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/merrvve%2Fpdf-image-extract","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/merrvve%2Fpdf-image-extract/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/merrvve%2Fpdf-image-extract/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/merrvve%2Fpdf-image-extract/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/merrvve","download_url":"https://codeload.github.com/merrvve/pdf-image-extract/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/merrvve%2Fpdf-image-extract/sbom","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":266204640,"owners_count":23892366,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["command-line-tool","pdf-extractor","pdf-image-extractor","python"],"created_at":"2024-11-20T10:17:19.152Z","updated_at":"2025-07-20T21:34:45.891Z","avatar_url":"https://github.com/merrvve.png","language":"Python","funding_links":[],"categories":[],"sub_categories":[],"readme":"# PDF IMAGE EXTRACTOR (JPEG AND PNG)\r\n\r\nThis script extracts and saves JPEG and PNG images embedded within PDF files.\r\n\r\nThe script reads PDF files in binary format, searches for embedded JPEG and PNG images\r\nby identifying their unique byte signatures, and saves each detected image into a separate\r\nfile in a designated output directory. The output directory is named after the input PDF file\r\nand is located in the 'results' folder. \r\n\r\n\r\n## Usage:\r\n    python3 bin/main.py input_file.pdf\r\n    python3 bin/main.py path/to/input/files\r\n\r\n## Arguments:\r\n    input_file.pdf (or) path/to/input/files : Path to the PDF files or a single pdf file from which images will be extracted.\r\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fmerrvve%2Fpdf-image-extract","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fmerrvve%2Fpdf-image-extract","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fmerrvve%2Fpdf-image-extract/lists"}