{"id":18541437,"url":"https://github.com/tensorsofthewall/vidtune","last_synced_at":"2026-03-07T13:32:31.913Z","repository":{"id":252829609,"uuid":"811125914","full_name":"tensorsofthewall/VidTune","owner":"tensorsofthewall","description":"Tailored Music For Your Videos","archived":false,"fork":false,"pushed_at":"2025-03-22T01:03:04.000Z","size":4879,"stargazers_count":2,"open_issues_count":2,"forks_count":1,"subscribers_count":1,"default_branch":"main","last_synced_at":"2025-04-10T11:43:42.402Z","etag":null,"topics":["audiocraft","generative-ai","generative-audio","google-gemini","meta-ai","music-generation","musicgen","streamlit","transformers","video-to-audio","vidtune"],"latest_commit_sha":null,"homepage":"https://huggingface.co/spaces/sandeshb/VidTune-Gradio","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"other","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/tensorsofthewall.png","metadata":{"files":{"readme":"README.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2024-06-06T01:42:57.000Z","updated_at":"2025-03-07T22:05:15.000Z","dependencies_parsed_at":"2025-04-09T18:42:45.323Z","dependency_job_id":"9cf2032e-b34a-4473-9805-c9c235471ac0","html_url":"https://github.com/tensorsofthewall/VidTune","commit_stats":null,"previous_names":["sandesh-bharadwaj/vidtune","tensorsofthewall/vidtune"],"tags_count":0,"template":false,"template_full_name":null,"purl":"pkg:github/tensorsofthewall/VidTune","repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/tensorsofthewall%2FVidTune","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/tensorsofthewall%2FVidTune/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/tensorsofthewall%2FVidTune/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/tensorsofthewall%2FVidTune/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/tensorsofthewall","download_url":"https://codeload.github.com/tensorsofthewall/VidTune/tar.gz/refs/heads/main","sbom_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/tensorsofthewall%2FVidTune/sbom","scorecard":null,"host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":286080680,"owners_count":30215674,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2026-03-07T13:25:55.541Z","status":"ssl_error","status_checked_at":"2026-03-07T13:25:38.596Z","response_time":53,"last_error":"SSL_read: unexpected eof while reading","robots_txt_status":"success","robots_txt_updated_at":"2025-07-24T06:49:26.215Z","robots_txt_url":"https://github.com/robots.txt","online":false,"can_crawl_api":true,"host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":["audiocraft","generative-ai","generative-audio","google-gemini","meta-ai","music-generation","musicgen","streamlit","transformers","video-to-audio","vidtune"],"created_at":"2024-11-06T20:05:05.250Z","updated_at":"2026-03-07T13:32:31.889Z","avatar_url":"https://github.com/tensorsofthewall.png","language":"Python","funding_links":[],"categories":[],"sub_categories":[],"readme":"---\ntitle: VidTune\ncolorFrom: indigo\ncolorTo: pink\nsdk: streamlit\npython_version: 3.9.19\nsdk_version: 1.36.0\nsuggested_hardware: t4-medium\nsuggested_storage: small\napp_file: main.py\npinned: true\npreload_from_hub:\n- facebook/musicgen-small\n- facebook/musicgen-medium\n- facebook/musicgen-large\nshort_description: Generate tailored soundtracks for your videos.\n---\n\n\u003c!-- Improved compatibility of back to top link: See: https://github.com/othneildrew/Best-README-Template/pull/73 --\u003e\n\u003ca id=\"readme-top\"\u003e\u003c/a\u003e\n\u003c!--\n*** Thanks for checking out the Best-README-Template. If you have a suggestion\n*** that would make this better, please fork the repo and create a pull request\n*** or simply open an issue with the tag \"enhancement\".\n*** Don't forget to give the project a star!\n*** Thanks again! Now go create something AMAZING! :D\n--\u003e\n\n\n\n\u003c!-- PROJECT SHIELDS --\u003e\n\u003c!--\n*** I'm using markdown \"reference style\" links for readability.\n*** Reference links are enclosed in brackets [ ] instead of parentheses ( ).\n*** See the bottom of this document for the declaration of the reference variables\n*** for contributors-url, forks-url, etc. This is an optional, concise syntax you may use.\n*** https://www.markdownguide.org/basic-syntax/#reference-style-links\n--\u003e\n[![Contributors][contributors-shield]][contributors-url]\n[![Forks][forks-shield]][forks-url]\n[![Stargazers][stars-shield]][stars-url]\n[![Issues][issues-shield]][issues-url]\n[![AGPL License][license-shield]][license-url]\n[![Sandesh-LinkedIn][sandesh-linkedin-shield]][sandesh-linkedin-url]\n[![Animikh-LinkedIn][animikh-linkedin-shield]][animikh-linkedin-url]\n\n\n\n\u003c!-- PROJECT LOGO --\u003e\n\u003cbr /\u003e\n\u003cdiv align=\"center\"\u003e\n  \u003ca href=\"https://github.com/sandesh-bharadwaj/VidTune\"\u003e\n    \u003cimg src=\"assets/VidTune-Logo-Without-BG.png\" alt=\"Logo\" width=\"80\" height=\"80\"\u003e\n  \u003c/a\u003e\n\n  \u003ch3 align=\"center\"\u003eVidTune\u003c/h3\u003e\n\n  \u003cp align=\"center\"\u003e\n    Tailored soundtracks for your videos\n    \u003cbr /\u003e\n    \u003cbr /\u003e\n    \u003ca href=\"https://github.com/sandesh-bharadwaj/VidTune/issues/new?labels=bug\u0026template=bug-report---.md\"\u003eReport Bug\u003c/a\u003e\n    ·\n    \u003ca href=\"https://github.com/sandesh-bharadwaj/VidTune/issues/new?labels=enhancement\u0026template=feature-request---.md\"\u003eRequest Feature\u003c/a\u003e\n  \u003c/p\u003e\n\u003c/div\u003e\n\n\n\n\u003c!-- TABLE OF CONTENTS --\u003e\n\u003cdetails\u003e\n  \u003csummary\u003eTable of Contents\u003c/summary\u003e\n  \u003col\u003e\n    \u003cli\u003e\n      \u003ca href=\"#about-the-project\"\u003eAbout The Project\u003c/a\u003e\n      \u003cul\u003e\n        \u003cli\u003e\u003ca href=\"#built-with\"\u003eBuilt With\u003c/a\u003e\u003c/li\u003e\n      \u003c/ul\u003e\n    \u003c/li\u003e\n    \u003cli\u003e\n      \u003ca href=\"#hardware-requirements\"\u003eHardware Requirements\u003c/a\u003e\n      \u003cul\u003e\n        \u003cli\u003e\u003ca href=\"#hardwarre-used-for-development-and-testing\"\u003eHardware used for Development and Testing\u003c/a\u003e\u003c/li\u003e\n      \u003c/ul\u003e\n    \u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#see-vidtune-in-action\"\u003eSee VidTune in action!\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#roadmap\"\u003eRoadmap\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#contributing\"\u003eContributing\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#license\"\u003eLicense\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#contact\"\u003eContact\u003c/a\u003e\u003c/li\u003e\n    \u003cli\u003e\u003ca href=\"#acknowledgments\"\u003eAcknowledgments\u003c/a\u003e\u003c/li\u003e\n  \u003c/ol\u003e\n\u003c/details\u003e\n\n\n\n\u003c!-- ABOUT THE PROJECT --\u003e\n## About The Project\n\n![startup_screen]\n\n**VidTune** is a generative AI application designed to create custom music tailored to your video content. By leveraging advanced AI models for video analysis and music creation, **VidTune** provides an intuitive and seamless experience for generating and integrating music into your videos.\n\n**VidTune** employs two state-of-the-art models for video understanding and music generation:\n1. [**Google Gemini**](https://ai.google.dev/gemini-api) - Google's largest and most capable multimodal AI model.\n2. [**MusicGen**](https://huggingface.co/facebook/musicgen-large) - Meta's text-to-music model, capable of generating high-quality music conditioned on text or audio prompts.\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n### Built With\n[![Transformers][Transformers-shield]][Transformers-url]\n[![Google Gemini][Google-Gemini-shield]][Google-Gemini-url]\n[![AudioCraft][AudioCraft-shield]][AudioCraft-url]\n[![MusicGen][MusicGen-shield]][MusicGen-url]\n[![Streamlit][Streamlit-shield]][Streamlit-url]\n\u003c!-- * [![Next][Next.js]][Next-url]\n* [![React][React.js]][React-url]\n* [![Vue][Vue.js]][Vue-url]\n* [![Angular][Angular.io]][Angular-url]\n* [![Svelte][Svelte.dev]][Svelte-url]\n* [![Laravel][Laravel.com]][Laravel-url]\n* [![Bootstrap][Bootstrap.com]][Bootstrap-url]\n* [![JQuery][JQuery.com]][JQuery-url] --\u003e\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n## Hardware Requirements\n\n### Hardware used for Development and Testing\n\n- **CPU:** AMD Ryzen 7 3700X - 8 Cores 16 Threads\n- **GPU:** Nvidia GeForce RTX 4060 Ti 16 GB\n- **RAM:** 64 GB DDR4 @ 3200 MHz\n- **OS:** Linux (WSL | Ubuntu 22.40)\n\nThe above is just used for development and by no means is necessary to run this application. The Minimum Hardware Requirements are given in the next section\n\nWhile VidTune is supported on CPU-only machines, we recommend using a GPU with minimum 16GB of memory for faster results.\n\n\n## See VidTune in action!\n[![Watch the video](https://img.youtube.com/vi/knbQjWZtL3Y/maxresdefault.jpg)](https://youtu.be/knbQjWZtL3Y)\n\n## Running VidTune\nFirst, clone the repository:\n```sh\ngit clone https://github.com/sandesh-bharadwaj/VidTune.git\ncd VidTune\n```\n### Using conda\nIf you're using conda as your virtual environment manager, do the following:\n```\nconda env create -f environment.yml\nconda activate vidtune\n\nstreamlit run main.py\n```\n\n### Using python / pip\n```\npip install -r requirements.txt\nstreamlit run main.py\n```\n\n### Using Docker\n- [Docker](https://docs.docker.com/engine/install/)\n- [Nvidia Docker](https://docs.nvidia.com/datacenter/cloud-native/container-toolkit/latest/install-guide.html#installing-with-apt)\n\nDocker Hub Image: https://hub.docker.com/r/animikhaich/vidtune\n\n```\ndocker run --rm -it --gpus all -p 8003:8003 animikhaich/vidtune\n```\n\n\n\n\u003c!-- ROADMAP --\u003e\n## Roadmap\n- [x] Customized Prompt for Gemini Prompting\n- [x] Flutter version of app for proof-of-concept\n- [x] MusicGen integration\n- [x] Audio Mixing\n- [x] Streamlit app\n- [x] Docker image\n- [ ] OpenVINO-optimized versions of MusicGen for CPU-Only use.\n- [ ] Support for music generation duration \u003e 30 seconds.\n- [ ] Add more settings for controlling generation.\n- [ ] Option to edit music prompts before music generation.\n\n\nSee the [open issues](https://github.com/sandesh-bharadwaj/VIdTune/issues) for a full list of proposed features (and known issues).\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- CONTRIBUTING --\u003e\n## Contributing\n\nIf you have a suggestion that would improve this, please **open an issue** with the tag *\"enhancement\"*.You can also **fork the repo** and create a pull request. Your feedback is greatly appreciated!\nDon't forget to give the project a star! Thanks again!\n\n1. Fork the Project\n2. Create your Feature Branch (`git checkout -b feature/AmazingFeature`)\n3. Commit your Changes (`git commit -m 'Add some AmazingFeature'`)\n4. Push to the Branch (`git push origin feature/AmazingFeature`)\n5. Open a Pull Request\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- LICENSE --\u003e\n## License\n\nDistributed under the CC BY-NC 4.0 License. See [`LICENSE`](./LICENSE) for more information.\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- CONTACT --\u003e\n## Contact\n\nSandesh Bharadwaj - sandesh.bharadwaj97@gmail.com\n\nAnimikh Aich - animikhaich@gmail.com\n\nProject Link: [https://github.com/sandesh-bharadwaj/VidTune](https://github.com/sandesh-bharadwaj/VidTune)\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- ACKNOWLEDGMENTS --\u003e\n## Acknowledgments\n\n* Google.\n* Meta.\n\n\n\u003cp align=\"right\"\u003e(\u003ca href=\"#readme-top\"\u003eback to top\u003c/a\u003e)\u003c/p\u003e\n\n\n\n\u003c!-- MARKDOWN LINKS \u0026 IMAGES --\u003e\n\u003c!-- https://www.markdownguide.org/basic-syntax/#reference-style-links --\u003e\n[contributors-shield]: https://img.shields.io/github/contributors/sandesh-bharadwaj/VidTune.svg?style=for-the-badge\n[contributors-url]: https://github.com/sandesh-bharadwaj/VidTune/graphs/contributors\n[forks-shield]: https://img.shields.io/github/forks/sandesh-bharadwaj/VidTune.svg?style=for-the-badge\n[forks-url]: https://github.com/sandesh-bharadwaj/VidTune/network/members\n[stars-shield]: https://img.shields.io/github/stars/sandesh-bharadwaj/VidTune.svg?style=for-the-badge\n[stars-url]: https://github.com/sandesh-bharadwaj/VidTune/stargazers\n[issues-shield]: https://img.shields.io/github/issues/sandesh-bharadwaj/VidTune.svg?style=for-the-badge\n[issues-url]: https://github.com/sandesh-bharadwaj/VidTune/issues\n[license-shield]: https://img.shields.io/github/license/sandesh-bharadwaj/VidTune.svg?style=for-the-badge\n[license-url]: https://github.com/sandesh-bharadwaj/VidTune/blob/main/LICENSE\n[llama-3-shield]: https://img.shields.io/badge/License-Llama%203-purple.svg?style=for-the-badge\n[llama-3-license]: https://github.com/sandesh-bharadwaj/VidTune/blob/main/LLAMA-3-LICENSE\n[sandesh-linkedin-shield]: https://img.shields.io/badge/-Sandesh_Bharadwaj-black.svg?style=for-the-badge\u0026logo=linkedin\u0026colorB=555\n[sandesh-linkedin-url]: https://linkedin.com/in/sandeshbharadwaj97\n[animikh-linkedin-shield]: https://img.shields.io/badge/-Animikh_Aich-black.svg?style=for-the-badge\u0026logo=linkedin\u0026colorB=555\n[animikh-linkedin-url]: https://linkedin.com/in/animikh-aich\n[startup_screen]: assets/homepage.png\n\n[Python-url]: https://img.shields.io/badge/python-3670A0?style=for-the-badge\u0026logo=python\u0026logoColor=ffdd54\n[Langchain-shield]: https://img.shields.io/badge/LangChain-0.2.12-1C3C3C?style=for-the-badge\u0026logo=langchain\n[Langchain-url]: https://github.com/langchain-ai/langchain\n[Transformers-shield]: https://img.shields.io/badge/Transformers-4.42.4-blue?style=for-the-badge\n[Transformers-url]: https://github.com/huggingface/transformers\n[Optimum-shield]: https://img.shields.io/badge/Optimum-1.21.2-blue?style=for-the-badge\n[Optimum-url]: https://github.com/huggingface/optimum\n[OpenVINO-shield]: https://img.shields.io/badge/OpenVINO-2024.3-purple?style=for-the-badge\n[OpenVINO-url]: https://github.com/openvinotoolkit/openvino\n[Chroma-shield]: https://img.shields.io/badge/Chroma-0.5.5-blue?style=for-the-badge\n[Chroma-url]: https://github.com/chroma-core/chroma\n\n[Google-Gemini-shield]: https://img.shields.io/badge/Google%20Gemini-886FBF?style=for-the-badge\u0026logo=googlegemini\u0026logoColor=fff\n[Google-Gemini-url]: https://ai.google.dev/gemini-api\n[Streamlit-shield]: https://img.shields.io/badge/-Streamlit-FF4B4B?style=for-the-badge\u0026logo=streamlit\u0026logoColor=white\n[Streamlit-url]: https://streamlit.io/\n\n[AudioCraft-shield]: https://img.shields.io/badge/-AudioCraft-blue?style=for-the-badge\u0026logo=Meta\n[AudioCraft-url]: https://audiocraft.metademolab.com/\n[MusicGen-shield]:https://img.shields.io/badge/-MusicGen-blue?style=for-the-badge\u0026logo=Meta\n[MusicGen-url]: https://musicgen.com/\n","project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Ftensorsofthewall%2Fvidtune","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Ftensorsofthewall%2Fvidtune","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Ftensorsofthewall%2Fvidtune/lists"}