{"id":13436160,"url":"https://github.com/openai/spinningup","last_synced_at":"2025-05-13T21:05:12.620Z","repository":{"id":37431079,"uuid":"156606738","full_name":"openai/spinningup","owner":"openai","description":"An educational resource to help anyone learn deep reinforcement learning.","archived":false,"fork":false,"pushed_at":"2024-08-05T03:30:30.000Z","size":31762,"stargazers_count":10831,"open_issues_count":245,"forks_count":2322,"subscribers_count":235,"default_branch":"master","last_synced_at":"2025-04-28T13:58:49.996Z","etag":null,"topics":[],"latest_commit_sha":null,"homepage":"https://spinningup.openai.com/","language":"Python","has_issues":true,"has_wiki":null,"has_pages":null,"mirror_url":null,"source_name":null,"license":"mit","status":null,"scm":"git","pull_requests_enabled":true,"icon_url":"https://github.com/openai.png","metadata":{"files":{"readme":"readme.md","changelog":null,"contributing":null,"funding":null,"license":"LICENSE","code_of_conduct":null,"threat_model":null,"audit":null,"citation":null,"codeowners":null,"security":null,"support":null,"governance":null,"roadmap":null,"authors":null,"dei":null,"publiccode":null,"codemeta":null}},"created_at":"2018-11-07T20:52:15.000Z","updated_at":"2025-04-28T09:35:04.000Z","dependencies_parsed_at":"2023-02-13T01:15:19.711Z","dependency_job_id":"68518edb-c6fe-49a9-954f-ab7ff834319d","html_url":"https://github.com/openai/spinningup","commit_stats":null,"previous_names":[],"tags_count":3,"template":false,"template_full_name":null,"repository_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/openai%2Fspinningup","tags_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/openai%2Fspinningup/tags","releases_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/openai%2Fspinningup/releases","manifests_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories/openai%2Fspinningup/manifests","owner_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners/openai","download_url":"https://codeload.github.com/openai/spinningup/tar.gz/refs/heads/master","host":{"name":"GitHub","url":"https://github.com","kind":"github","repositories_count":254028536,"owners_count":22002275,"icon_url":"https://github.com/github.png","version":null,"created_at":"2022-05-30T11:31:42.601Z","updated_at":"2022-07-04T15:15:14.044Z","host_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub","repositories_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repositories","repository_names_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/repository_names","owners_url":"https://repos.ecosyste.ms/api/v1/hosts/GitHub/owners"}},"keywords":[],"created_at":"2024-07-31T03:00:44.875Z","updated_at":"2025-05-13T21:05:07.612Z","avatar_url":"https://github.com/openai.png","language":"Python","readme":"**Status:** Maintenance (expect bug fixes and minor updates)\n\nWelcome to Spinning Up in Deep RL! \n==================================\n\nThis is an educational resource produced by OpenAI that makes it easier to learn about deep reinforcement learning (deep RL).\n\nFor the unfamiliar: [reinforcement learning](https://en.wikipedia.org/wiki/Reinforcement_learning) (RL) is a machine learning approach for teaching agents how to solve tasks by trial and error. Deep RL refers to the combination of RL with [deep learning](http://ufldl.stanford.edu/tutorial/).\n\nThis module contains a variety of helpful resources, including:\n\n- a short [introduction](https://spinningup.openai.com/en/latest/spinningup/rl_intro.html) to RL terminology, kinds of algorithms, and basic theory,\n- an [essay](https://spinningup.openai.com/en/latest/spinningup/spinningup.html) about how to grow into an RL research role,\n- a [curated list](https://spinningup.openai.com/en/latest/spinningup/keypapers.html) of important papers organized by topic,\n- a well-documented [code repo](https://github.com/openai/spinningup) of short, standalone implementations of key algorithms,\n- and a few [exercises](https://spinningup.openai.com/en/latest/spinningup/exercises.html) to serve as warm-ups.\n\nGet started at [spinningup.openai.com](https://spinningup.openai.com)!\n\n\nCiting Spinning Up\n------------------\n\nIf you reference or use Spinning Up in your research, please cite:\n\n```\n@article{SpinningUp2018,\n    author = {Achiam, Joshua},\n    title = {{Spinning Up in Deep Reinforcement Learning}},\n    year = {2018}\n}\n```","funding_links":[],"categories":["Reinforcement Learning","Tutorials","**Section 5: Prompt Engineering, Finetuning, and Visual Prompts**","Python","Reinforcement Learning (RL) and Deep Reinforcement Learning (DRL)","Deep Learning"],"sub_categories":["**RLHF (Reinforcement Learning from Human Feedback) \u0026 SFT (Supervised Fine-Tuning)**","RL/DRL Algorithm Implementations and Software Frameworks","2. Documentation"],"project_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fopenai%2Fspinningup","html_url":"https://awesome.ecosyste.ms/projects/github.com%2Fopenai%2Fspinningup","lists_url":"https://awesome.ecosyste.ms/api/v1/projects/github.com%2Fopenai%2Fspinningup/lists"}