{"id":21673642,"url":"https://github.com/agenty/agenty.testdata","last_synced_at":"2026-01-04T12:30:58.028Z","repository":{"id":115857463,"uuid":"174453777","full_name":"Agenty/Agenty.TestData","owner":"Agenty","description":"This project contains the public test data set to try and learn how to use cloud-based agents in Agenty.","archived":false,"fork":false,"pushed_at":"2022-12-27T10:28:03.000Z","size":7037,"stargazers_count":0,"open_issues_count":0,"forks_count":0,"subscribers_count":2,"default_branch":"master","last_synced_at":"2025-01-25T09:42:03.951Z","etag":null,"topics":["bigdata","datascraping","htmlparser","machine-intelligence","ocr","webdata","webscraping"],"latest_commit_sha":null,"homepage":"https://www.agenty.com","language":"HTML","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"mit","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/Agenty.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2019-03-08T02:19:19.000Z","updated_at":"2022-01-13T11:24:49.000Z","dependencies_parsed_at":null,"dependency_job_id":"99f8fe8e-4cc7-4010-acab-7120c00a1d0d","html_url":"https://github.com/Agenty/Agenty.TestData","commit_stats":null,"previous_names":[],"tags_count":0,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Agenty%2FAgenty.TestData","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Agenty%2FAgenty.TestData/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/Agenty%2FAgenty.TestData/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories
/Agenty%2FAgenty.TestData/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/Agenty","download_url":"https://codeload.github.com/Agenty/Agenty.TestData/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":244582770,"owners_count":20476233,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["bigdata","datascraping","htmlparser","machine-intelligence","ocr","webdata","webscraping"],"created_at":"2024-11-25T13:40:15.334Z","updated_at":"2026-01-04T12:30:53.005Z","avatar_url":"https://github.com/Agenty.png","language":"HTML","readme":"# Agenty Test Data\nThis project contains the public test data set to try and learn how to use cloud-based agents in [Agenty](https://www.agenty.com/).\n\n## Web Scraping\nTest data for [web scraping](https://www.agenty.com/products/scraping-agent/)\n### HTML\n- [Ecommerce products list](https://agenty.github.io/Agenty.TestData/scraping/html/ecommerce-product-list.html)\n- [Meta tags](https://agenty.github.io/Agenty.TestData/scraping/html/meta-tags.html)\n- [Simple products list](https://agenty.github.io/Agenty.TestData/scraping/html/simple-products-list.html)\n- [Simple HTML table](https://agenty.github.io/Agenty.TestData/scraping/html/simple-table.html)\n- [HTML table with heading](https://agenty.github.io/Agenty.TestData/scraping/html/table-with-headings.html)\n- [Blog post article with schema](https://agenty.github.io/Agenty.TestData/scraping/html/article-with-schema.html)\n\n## OCR\nTest data for [OCR](https://www.agenty.com/products/ocr-agent/) agent\n### 
English\n- [GIF](https://raw.githubusercontent.com/Agenty/Agenty.TestData/master/ocr/gif-example.gif)\n- [JPG](https://raw.githubusercontent.com/Agenty/Agenty.TestData/master/ocr/jpeg-example.jpg)\n- [PNG](https://raw.githubusercontent.com/Agenty/Agenty.TestData/master/ocr/png-example.png)\n- [PNG](https://raw.githubusercontent.com/Agenty/Agenty.TestData/master/ocr/english_text.png)\n- [TIFF](https://raw.githubusercontent.com/Agenty/Agenty.TestData/master/ocr/tiff-example.tif)\n\n### French\n\n- [PNG](https://raw.githubusercontent.com/Agenty/Agenty.TestData/master/ocr/french_text.png)\n","funding_links":[],"categories":[],"sub_categories":[],"project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fagenty%2Fagenty.testdata","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fagenty%2Fagenty.testdata","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fagenty%2Fagenty.testdata/lists"}