{"id":13415174,"url":"https://github.com/datahub-project/datahub","last_synced_at":"2026-04-02T10:45:05.691Z","repository":{"id":37026743,"uuid":"46398090","full_name":"datahub-project/datahub","owner":"datahub-project","description":"The Metadata Platform for your Data and AI Stack","archived":false,"fork":false,"pushed_at":"2025-05-12T14:12:22.000Z","size":409113,"stargazers_count":10585,"open_issues_count":499,"forks_count":3108,"subscribers_count":255,"default_branch":"master","last_synced_at":"2025-05-12T14:31:01.368Z","etag":null,"topics":["data-catalog","data-discovery","data-governance","datahub","metadata"],"latest_commit_sha":null,"homepage":"https://datahub.com","language":"Java","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"apache-2.0","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/datahub-project.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":"docs/CONTRIBUTING.md","funding":null,"license":"LICENSE","code_of_conduct":"docs/CODE_OF_CONDUCT.md","threat_model":null,"audit":null,"citation":null,"codeowners":"CODEOWNERS","security":"SECURITY.md","support":null,"governance":null,"roadmap":"docs/roadmap.md","authors":null,"dei":null,"publiccode":null,"codemeta":null,"zenodo":null}},"created_at":"2015-11-18T05:47:40.000Z","updated_at":"2025-05-12T14:02:08.000Z","dependencies_parsed_at":"2023-09-22T01:20:52.306Z","dependency_job_id":"cdff2be5-aa4e-4088-bfc1-43b722949e19","html_url":"https://github.com/datahub-project/datahub","commit_stats":{"total_commits":9138,"total_committers":538,"mean_commits":"16.985130111524164","dds":0.8870650032829941,"last_synced_commit":"8f40229da2469b7c60864616149b67e467645cd2"},"previous_names":["linkedin/datahub","linkedin/wherehows"],"tags_count":112,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datahub-project%2Fdatahub","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datahub-project%2Fdatahub/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datahub-project%2Fdatahub/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/datahub-project%2Fdatahub/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/datahub-project","download_url":"https://codeload.github.com/datahub-project/datahub/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":253755800,"owners_count":21959085,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["data-catalog","data-discovery","data-governance","datahub","metadata"],"created_at":"2024-07-30T21:00:44.536Z","updated_at":"2026-02-06T02:19:26.773Z","avatar_url":"https://github.com/datahub-project.png","language":"Java","readme":"\u003c!--HOSTED_DOCS_ONLY\nimport useBaseUrl from '@docusaurus/useBaseUrl';\n\nexport const Logo = (props) =\u003e {\n  return (\n    \u003cdiv style={{ display: \"flex\", justifyContent: \"center\", padding: \"20px\", height: \"190px\" }}\u003e\n      \u003cimg\n        alt=\"DataHub Logo\"\n        src=\"https://raw.githubusercontent.com/datahub-project/static-assets/main/imgs/datahub-logo-color-mark.svg\"\n        {...props}\n      /\u003e\n    \u003c/div\u003e\n  );\n};\n\n\u003cLogo /\u003e\n\n\u003c!--\nHOSTED_DOCS_ONLY--\u003e\n\u003cp align=\"center\"\u003e\n\u003ca href=\"https://datahubproject.io\"\u003e\n\u003cimg alt=\"DataHub\" src=\"https://raw.githubusercontent.com/datahub-project/static-assets/main/imgs/datahub-logo-color-mark.svg\" height=\"150\" /\u003e\n\u003c/a\u003e\n\u003c/p\u003e\n\u003c!-- --\u003e\n\n# DataHub: The Data Discovery Platform for the Modern Data Stack\n\n### Built with ❤️ by \u003cimg src=\"https://datahubproject.io/img/acryl-logo-light-mark.png\" width=\"20\"/\u003e [Acryl Data](https://acryldata.io) and \u003cimg src=\"https://datahubproject.io/img/LI-In-Bug.png\" width=\"20\"/\u003e [LinkedIn](https://engineering.linkedin.com)\n\n\u003cdiv\u003e\n  \u003ca target=\"_blank\" href=\"https://github.com/datahub-project/datahub/blob/master/LICENSE\"\u003e\n    \u003cimg alt=\"Apache 2.0 License\" src=\"https://img.shields.io/badge/License-Apache_2.0-blue.svg?label=license\u0026labelColor=133554\u0026color=1890ff\" /\u003e\u003c/a\u003e\n  \u003ca target=\"_blank\" href=\"https://pypi.org/project/acryl-datahub/\"\u003e\n    \u003cimg alt=\"PyPI\" src=\"https://img.shields.io/pypi/dm/acryl-datahub?label=downloads\u0026labelColor=133554\u0026color=1890ff\" /\u003e\u003c/a\u003e\n  \u003ca target=\"_blank\" href=\"https://github.com/datahub-project/datahub/pulse\"\u003e\n    \u003cimg alt=\"GitHub commit activity\" src=\"https://img.shields.io/github/commit-activity/m/datahub-project/datahub?label=commits\u0026labelColor=133554\u0026color=1890ff\" /\u003e\u003c/a\u003e\n  \u003cbr /\u003e\n  \u003ca target=\"_blank\" href=\"https://pages.acryl.io/slack?utm_source=github\u0026utm_medium=readme\u0026utm_campaign=github_readme\"\u003e\n    \u003cimg alt=\"Slack\" src=\"https://img.shields.io/badge/slack-join_community-red.svg?logo=slack\u0026labelColor=133554\u0026color=1890ff\" /\u003e\u003c/a\u003e\n  \u003ca href=\"https://www.youtube.com/channel/UC3qFQC5IiwR5fvWEqi_tJ5w\"\u003e\n    \u003cimg alt=\"YouTube\" src=\"https://img.shields.io/youtube/channel/subscribers/UC3qFQC5IiwR5fvWEqi_tJ5w?style=flat\u0026logo=youtube\u0026label=subscribers\u0026labelColor=133554\u0026color=1890ff\"/\u003e\u003c/a\u003e\n  \u003ca href=\"https://blog.datahubproject.io/\"\u003e\n    \u003cimg alt=\"Medium\" src=\"https://img.shields.io/badge/blog-DataHub-red.svg?style=flat\u0026logo=medium\u0026logoColor=white\u0026labelColor=133554\u0026color=1890ff\" /\u003e\u003c/a\u003e\n  \u003ca href=\"https://x.com/datahubproject\"\u003e\n    \u003cimg alt=\"X (formerly Twitter) Follow\" src=\"https://img.shields.io/badge/follow-datahubproject-red.svg?style=flat\u0026logo=x\u0026labelColor=133554\u0026color=1890ff\" /\u003e\u003c/a\u003e\n\u003c/div\u003e\n\n---\n\n### 🏠 Docs: [datahubproject.io](https://datahubproject.io/docs)\n\n[Quickstart](https://datahubproject.io/docs/quickstart) |\n[Features](https://datahubproject.io/docs/) |\n[Roadmap](https://feature-requests.datahubproject.io/roadmap) |\n[Adoption](#adoption) |\n[Demo](https://demo.datahubproject.io/) |\n[Town Hall](https://datahubproject.io/docs/townhalls)\n\n---\n\n\u003e 📣 DataHub Town Hall is the 4th Thursday at 9am US PT of every month - [add it to your calendar!](https://rsvp.datahubproject.io/)\n\u003e\n\u003e - Town-hall Zoom link: [zoom.datahubproject.io](https://zoom.datahubproject.io)\n\u003e - [Meeting details](docs/townhalls.md) \u0026 [past recordings](docs/townhall-history.md)\n\n\u003e ✨ DataHub Community Highlights:\n\u003e\n\u003e - Read our Monthly Project Updates [here](https://blog.datahubproject.io/tagged/project-updates).\n\u003e - Bringing The Power Of The DataHub Real-Time Metadata Graph To Everyone At Acryl Data: [Data Engineering Podcast](https://www.dataengineeringpodcast.com/acryl-data-datahub-metadata-graph-episode-230/)\n\u003e - Check out our most-read blog post, [DataHub: Popular Metadata Architectures Explained](https://engineering.linkedin.com/blog/2020/datahub-popular-metadata-architectures-explained) @ LinkedIn Engineering Blog.\n\u003e - Join us on [Slack](docs/slack.md)! Ask questions and keep up with the latest announcements.\n\n## Introduction\n\nDataHub is an open-source data catalog for the modern data stack. Read about the architectures of different metadata systems and why DataHub excels [here](https://engineering.linkedin.com/blog/2020/datahub-popular-metadata-architectures-explained). Also read our\n[LinkedIn Engineering blog post](https://engineering.linkedin.com/blog/2019/data-hub), check out our [Strata presentation](https://speakerdeck.com/shirshanka/the-evolution-of-metadata-linkedins-journey-strata-nyc-2019) and watch our [Crunch Conference Talk](https://www.youtube.com/watch?v=OB-O0Y6OYDE). You should also visit [DataHub Architecture](docs/architecture/architecture.md) to get a better understanding of how DataHub is implemented.\n\n## Features \u0026 Roadmap\n\nCheck out DataHub's [Features](docs/features.md) \u0026 [Roadmap](https://feature-requests.datahubproject.io/roadmap).\n\n## Demo and Screenshots\n\nThere's a [hosted demo environment](https://demo.datahubproject.io/) courtesy of [Acryl Data](https://acryldata.io) where you can explore DataHub without installing it locally.\n\n## Quickstart\n\nPlease follow the [DataHub Quickstart Guide](https://datahubproject.io/docs/quickstart) to run DataHub locally using [Docker](https://docker.com).\n\n## Development\n\nIf you're looking to build \u0026 modify datahub please take a look at our [Development Guide](https://datahubproject.io/docs/developers).\n\n\u003cp align=\"center\"\u003e\n\u003ca href=\"https://demo.datahubproject.io/\"\u003e\n  \u003cimg width=\"70%\"  src=\"https://raw.githubusercontent.com/datahub-project/static-assets/main/imgs/entity.png\"/\u003e\n\u003c/a\u003e\n\u003c/p\u003e\n\n## Source Code and Repositories\n\n- [datahub-project/datahub](https://github.com/datahub-project/datahub): This repository contains the complete source code for DataHub's metadata model, metadata services, integration connectors and the web application.\n- [acryldata/datahub-actions](https://github.com/acryldata/datahub-actions): DataHub Actions is a framework for responding to changes to your DataHub Metadata Graph in real time.\n- [acryldata/datahub-helm](https://github.com/acryldata/datahub-helm): Repository of helm charts for deploying DataHub on a Kubernetes cluster\n- [acryldata/meta-world](https://github.com/acryldata/meta-world): A repository to store recipes, custom sources, transformations and other things to make your DataHub experience magical\n- [dbt-impact-action](https://github.com/acryldata/dbt-impact-action) : This repository contains a github action for commenting on your PRs with a summary of the impact of changes within a dbt project\n- [datahub-tools](https://github.com/makenotion/datahub-tools) : Additional python tools to interact with the DataHub GraphQL endpoints, built by Notion\n- [business-glossary-sync-action](https://github.com/acryldata/business-glossary-sync-action) : This repository contains a github action that opens PRs to update your business glossary yaml file.\n\n## Releases\n\nSee [Releases](https://github.com/datahub-project/datahub/releases) page for more details. We follow the [SemVer Specification](https://semver.org) when versioning the releases and adopt the [Keep a Changelog convention](https://keepachangelog.com/) for the changelog format.\n\n## Contributing\n\nWe welcome contributions from the community. Please refer to our [Contributing Guidelines](docs/CONTRIBUTING.md) for more details. We also have a [contrib](contrib) directory for incubating experimental features.\n\n## Community\n\nJoin our [Slack workspace](https://pages.acryl.io/slack?utm_source=github\u0026utm_medium=readme\u0026utm_campaign=github_readme) for discussions and important announcements. You can also find out more about our upcoming [town hall meetings](docs/townhalls.md) and view past recordings.\n\n## Security\n\nSee [Security Stance](docs/SECURITY_STANCE.md) for information on DataHub's Security.\n\n## Adoption\n\nHere are the companies that have officially adopted DataHub. Please feel free to add yours to the list if we missed it.\n\n- [ABLY](https://ably.team/)\n- [Adevinta](https://www.adevinta.com/)\n- [Banksalad](https://www.banksalad.com)\n- [Cabify](https://cabify.tech/)\n- [ClassDojo](https://www.classdojo.com/)\n- [Coursera](https://www.coursera.org/)\n- [CVS Health](https://www.cvshealth.com/)\n- [DefinedCrowd](http://www.definedcrowd.com)\n- [DFDS](https://www.dfds.com/)\n- [Digital Turbine](https://www.digitalturbine.com/)\n- [Expedia Group](http://expedia.com)\n- [Experius](https://www.experius.nl)\n- [Geotab](https://www.geotab.com)\n- [Grofers](https://grofers.com)\n- [Haibo Technology](https://www.botech.com.cn)\n- [hipages](https://hipages.com.au/)\n- [inovex](https://www.inovex.de/)\n- [Inter\u0026Co](https://inter.co/)\n- [IOMED](https://iomed.health)\n- [Klarna](https://www.klarna.com)\n- [LinkedIn](http://linkedin.com)\n- [Moloco](https://www.moloco.com/en)\n- [N26](https://n26brasil.com/)\n- [Optum](https://www.optum.com/)\n- [Peloton](https://www.onepeloton.com)\n- [PITS Global Data Recovery Services](https://www.pitsdatarecovery.net/)\n- [Razer](https://www.razer.com)\n- [Rippling](https://www.rippling.com/)\n- [Showroomprive](https://www.showroomprive.com/)\n- [SpotHero](https://spothero.com)\n- [Stash](https://www.stash.com)\n- [Shanghai HuaRui Bank](https://www.shrbank.com)\n- [s7 Airlines](https://www.s7.ru/)\n- [ThoughtWorks](https://www.thoughtworks.com)\n- [TypeForm](http://typeform.com)\n- [Udemy](https://www.udemy.com/)\n- [Uphold](https://uphold.com)\n- [Viasat](https://viasat.com)\n- [Wealthsimple](https://www.wealthsimple.com)\n- [Wikimedia](https://www.wikimedia.org)\n- [Wolt](https://wolt.com)\n- [Zynga](https://www.zynga.com)\n\n## Select Articles \u0026 Talks\n\n- [DataHub Blog](https://blog.datahubproject.io/)\n- [DataHub YouTube Channel](https://www.youtube.com/channel/UC3qFQC5IiwR5fvWEqi_tJ5w)\n- [Optum: Data Mesh via DataHub](https://opensource.optum.com/blog/2022/03/23/data-mesh-via-datahub)\n- [Saxo Bank: Enabling Data Discovery in Data Mesh](https://medium.com/datahub-project/enabling-data-discovery-in-a-data-mesh-the-saxo-journey-451b06969c8f)\n- [Bringing The Power Of The DataHub Real-Time Metadata Graph To Everyone At Acryl Data](https://www.dataengineeringpodcast.com/acryl-data-datahub-metadata-graph-episode-230/)\n- [DataHub: Popular Metadata Architectures Explained](https://engineering.linkedin.com/blog/2020/datahub-popular-metadata-architectures-explained)\n- [Driving DataOps Culture with LinkedIn DataHub](https://www.youtube.com/watch?v=ccsIKK9nVxk) @ [DataOps Unleashed 2021](https://dataopsunleashed.com/#shirshanka-session)\n- [The evolution of metadata: LinkedIn’s story](https://speakerdeck.com/shirshanka/the-evolution-of-metadata-linkedins-journey-strata-nyc-2019) @ [Strata Data Conference 2019](https://conferences.oreilly.com/strata/strata-ny-2019.html)\n- [Journey of metadata at LinkedIn](https://www.youtube.com/watch?v=OB-O0Y6OYDE) @ [Crunch Data Conference 2019](https://crunchconf.com/2019)\n- [DataHub Journey with Expedia Group](https://www.youtube.com/watch?v=ajcRdB22s5o)\n- [Data Discoverability at SpotHero](https://www.slideshare.net/MaggieHays/data-discoverability-at-spothero)\n- [Data Catalogue — Knowing your data](https://medium.com/albert-franzi/data-catalogue-knowing-your-data-15f7d0724900)\n- [DataHub: A Generalized Metadata Search \u0026 Discovery Tool](https://engineering.linkedin.com/blog/2019/data-hub)\n- [Open sourcing DataHub: LinkedIn’s metadata search and discovery platform](https://engineering.linkedin.com/blog/2020/open-sourcing-datahub--linkedins-metadata-search-and-discovery-p)\n- [Emerging Architectures for Modern Data Infrastructure](https://future.com/emerging-architectures-for-modern-data-infrastructure-2020/)\n\nSee the full list [here](docs/links.md).\n\n## License\n\n[Apache License 2.0](./LICENSE).\n","funding_links":[],"categories":["Java","其他_机器学习与深度学习","数据中台","hacktoberfest","📂 Additional Sections","新项目脚手架","GenAI Readiness Features","Model, Data and Experiment Management","🔐 Data Privacy \u0026 Governance","大数据","Data","⚙️ Data Engineering"],"sub_categories":["3. Open-source Projects","Data Quality, Observability \u0026 Governance","📰 Blogs","Catalog","Tools"],"project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdatahub-project%2Fdatahub","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fdatahub-project%2Fdatahub","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fdatahub-project%2Fdatahub/lists"}