Awesome Reinforcement Learning Library
RL Library
RL Accelerated Environment
Star |
Last Update |
Name |
Backend |
![GitHub stars](https://camo.githubusercontent.com/7004f913c042ab2b8cfa9e5eb42e40c4476ed77576ad005ea3b2a244b54e8dbd/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7261792d70726f6a6563742f726179) |
![GitHub last commit](https://camo.githubusercontent.com/c7075c0102a09c2bd48f165d7a92cbd21fdaedbd96dc3cbeff16c5c6192af26f/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7261792d70726f6a6563742f7261793f6c6162656c3d6c617374253230757064617465) |
ray |
pytorch, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/417ee070db2e8444d2d4635eac1d3c9b9c17a699e13147c5b301179898803db9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6f70656e61692f626173656c696e6573) |
![GitHub last commit](https://camo.githubusercontent.com/5880183e79207a42135a82a8c6253115715f28da2bd637a1d2762114bdbac4d5/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6f70656e61692f626173656c696e65733f6c6162656c3d6c617374253230757064617465) |
baselines |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/e7e06bdb3ae8794ff445988cd23be545be1c0fceac07864daba6d5cf9a691af9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652f646f70616d696e65) |
![GitHub last commit](https://camo.githubusercontent.com/4c4b02d7642237fcc78a96ec535b6ea899fff0135230117e3c21bd2ef5ce00d4/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652f646f70616d696e653f6c6162656c3d6c617374253230757064617465) |
dopamine |
tensorflow-2.x, tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/7a6d6bb6c4919bfed0055f4205c808902656a88ed1a4ffb9186bdaa4d80a3153/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f74656e736f726c617965722f54656e736f724c61796572) |
![GitHub last commit](https://camo.githubusercontent.com/2680503de65c03f8ca316def6afe33c1fba8758d892f1a8f975ddde10429de06/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f74656e736f726c617965722f54656e736f724c617965723f6c6162656c3d6c617374253230757064617465) |
TensorLayer |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/0246bfc9ef0b5ba6f0aeab585c1e5be45a759f06404074d7a3d4247f027e6e5a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6f70656e61692f7370696e6e696e677570) |
![GitHub last commit](https://camo.githubusercontent.com/1b264a12072e9b8fa62f12c189dd5bdadeaa0d6fb28612624973269b735e974d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6f70656e61692f7370696e6e696e6775703f6c6162656c3d6c617374253230757064617465) |
spinningup |
pytorch, tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/b90756012fa83a4bb0daf7c3fce39c75a13577e6b1062c929cbe1522e4209b06/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b657261732d726c2f6b657261732d726c) |
![GitHub last commit](https://camo.githubusercontent.com/f60af699dabee4b3896a2bb653d782a7579134ee8b4a3839ed357bc59fde2aef/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b657261732d726c2f6b657261732d726c3f6c6162656c3d6c617374253230757064617465) |
keras-rl |
keras |
![GitHub stars](https://camo.githubusercontent.com/b08ba35f59df8bc0090d12028e16f44ff5619b9fc0a5fb94533490f33faa69fd/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7468752d6d6c2f7469616e73686f75) |
![GitHub last commit](https://camo.githubusercontent.com/2523b54a091cb5f9cb6c2c3e66d05972419d2294ffef85661dfb910a6ee40fe9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7468752d6d6c2f7469616e73686f753f6c6162656c3d6c617374253230757064617465) |
tianshou |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/a7ba9fe803c404e5b36b9b39f18b800fbd77986805603a2ae83c2a35e297829f/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f702d6368726973742f446565702d5265696e666f7263656d656e742d4c6561726e696e672d416c676f726974686d732d776974682d5079546f726368) |
![GitHub last commit](https://camo.githubusercontent.com/f088e893b539a161c2db36876e6b0e61447f461964f5c8fbc600ddebc3ff2e53/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f702d6368726973742f446565702d5265696e666f7263656d656e742d4c6561726e696e672d416c676f726974686d732d776974682d5079546f7263683f6c6162656c3d6c617374253230757064617465) |
Deep-Reinforcement-Learning-Algorithms-with-PyTorch |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/35d7ea9aa5d9b7929477317f4df1ce5c50b834d85612f849aaa8a7fda2640417/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f444c522d524d2f737461626c652d626173656c696e657333) |
![GitHub last commit](https://camo.githubusercontent.com/eb783cf6a455f37502486622fcfe98d1d94d37b7ac5f002050e90c99a5845755/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f444c522d524d2f737461626c652d626173656c696e6573333f6c6162656c3d6c617374253230757064617465) |
stable-baselines3 |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/5744dcdfcae41b3ec88f5dae7580fd9b365a02cb5bb23008e03649b7a9e7def3/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f52654167656e74) |
![GitHub last commit](https://camo.githubusercontent.com/27a254c4c9e7a0a8ba8fbeca15351bcb82f5b302f11f5aaf13d5450e4c4a1b28/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f52654167656e743f6c6162656c3d6c617374253230757064617465) |
ReAgent |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/a9dfff1b5e42d43a3f92f48a26b8c039480e871dd948fc5e2fccb78294f84860/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646565706d696e642f6f70656e5f737069656c) |
![GitHub last commit](https://camo.githubusercontent.com/46bd08a674fbab36b559d0330bdc77c297a285b0e0954a4c8083e70629251b8d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646565706d696e642f6f70656e5f737069656c3f6c6162656c3d6c617374253230757064617465) |
open_spiel |
pytorch, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/76b15c7e97de99982d3e579fb86e819c862bba7bff71599bb1fe0e1ccc7962e8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646565706d696e642f7472666c) |
![GitHub last commit](https://camo.githubusercontent.com/471e90a619a2a75182d74fa7fb0aee50859c795affb0ed82c8252c0aca769541/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646565706d696e642f7472666c3f6c6162656c3d6c617374253230757064617465) |
trfl |
tensorflow-2.x, tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/a4be07b92718bc9f9a1f6905b47f5e7a2267fde7ce4b3ceff9714e8d8caa3688/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f74656e736f72666f7263652f74656e736f72666f726365) |
![GitHub last commit](https://camo.githubusercontent.com/e78f9b706fc48aa05c33ccd72ffa8e41979fab387833ce5850542ac17ab22c71/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f74656e736f72666f7263652f74656e736f72666f7263653f6c6162656c3d6c617374253230757064617465) |
tensorforce |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/6d7dca798dd1a8a509b89ae60accb691ffaeec37316e6921f46c7497e688d621/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f696b6f737472696b6f762f7079746f7263682d6132632d70706f2d61636b74722d6761696c) |
![GitHub last commit](https://camo.githubusercontent.com/41ad0fe3e3712ce33c7250e0a3b412b1beecd5640e7aec078c2bf39ad865bf7d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f696b6f737472696b6f762f7079746f7263682d6132632d70706f2d61636b74722d6761696c3f6c6162656c3d6c617374253230757064617465) |
pytorch-a2c-ppo-acktr-gail |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/140915fe4dd91949c04e95629b4f1000737b7cad555bbdc35a6d893acc20016d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646565706d696e642f61636d65) |
![GitHub last commit](https://camo.githubusercontent.com/1f40e42d36211901adc75c764d977ed3677371b0cadc3d9aa5971e6c7968617e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646565706d696e642f61636d653f6c6162656c3d6c617374253230757064617465) |
acme |
jax, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/d696d2d9b4ef08fe5dcae5180209cb19e5873eaa29e6bf617a53eef80838c013/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b7761692f446f755a65726f) |
![GitHub last commit](https://camo.githubusercontent.com/d4bb8a86151a23b60431b92a9582120946ccd3a697499cca374407ebc783d1f8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b7761692f446f755a65726f3f6c6162656c3d6c617374253230757064617465) |
DouZero |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/5506a2a5f33dd4cc7ce7768c8aec837ac0533f7cc3494aac99e6e2cd628899ed/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f506164646c65506164646c652f5041524c) |
![GitHub last commit](https://camo.githubusercontent.com/7ef8ad17575ef31960307537291b982f0d86c9796594e403580c87f9421843fd/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f506164646c65506164646c652f5041524c3f6c6162656c3d6c617374253230757064617465) |
PARL |
paddle, pytorch |
![GitHub stars](https://camo.githubusercontent.com/d1d64057baa749d5d22bb1303ce15dda92ee3e8b76664c38fa57d58e14d77508/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f74656e736f72666c6f772f6167656e7473) |
![GitHub last commit](https://camo.githubusercontent.com/0ed65ee8f503233c283515424befa3f78c3aee4a03f2b182512360e31de0ad61/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f74656e736f72666c6f772f6167656e74733f6c6162656c3d6c617374253230757064617465) |
agents |
tensorflow-2.x, tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/c0784151fc93fcd6d9ff4135455356f986f4fc100e92e6c6acbc48d7bfc63ae8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f496e74656c4c6162732f636f616368) |
![GitHub last commit](https://camo.githubusercontent.com/4deec427427f680d449a0234cd33af0cf094d26553aae0ddec231590995740b3/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f496e74656c4c6162732f636f6163683f6c6162656c3d6c617374253230757064617465) |
coach |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/03130dd63b7b18e6c8d63be59f029d1faff68b2ba3db9ee30851216fb51c6f46/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6173746f6f6b652f726c707974) |
![GitHub last commit](https://camo.githubusercontent.com/c4a6381bfee0d40a23ce88f9a7f4bf2cc2d6435fe7792d9d03e509cddad3a302/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6173746f6f6b652f726c7079743f6c6162656c3d6c617374253230757064617465) |
rlpyt |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/38246c671b12c7ea1178840fa7a4dd233172095e9a08c6f1f9d331d0bcc1507b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f41493446696e616e63652d466f756e646174696f6e2f456c6567616e74524c) |
![GitHub last commit](https://camo.githubusercontent.com/530451ea5c41b9ca53d225f014604a06a315b547a59a6f1aca1598c46af47e3e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f41493446696e616e63652d466f756e646174696f6e2f456c6567616e74524c3f6c6162656c3d6c617374253230757064617465) |
ElegantRL |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/10d6946042ab9f752c85da097af526c7ee949b6a238ab5bcb5b78020a6d664ec/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7261696c2d6265726b656c65792f726c6b6974) |
![GitHub last commit](https://camo.githubusercontent.com/cfb39fd79ab41745ffc494ec5b9777aa2df72248ee6369909ea3989cda88f194/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7261696c2d6265726b656c65792f726c6b69743f6c6162656c3d6c617374253230757064617465) |
rlkit |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/c992f47df88fb89875b8eb8d5dedd43e9ee4aee6704c2748374ef535e620c00b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646174616d6c6c61622f726c63617264) |
![GitHub last commit](https://camo.githubusercontent.com/5d4c0eef23f9a456f315d722b96d868bc0d5263ffc17262713c28114e976a32a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646174616d6c6c61622f726c636172643f6c6162656c3d6c617374253230757064617465) |
rlcard |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/fd84db8ae3226e622236baa8512e302628d83390b335fff57aae3566453cb052/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f726c776f726b67726f75702f676172616765) |
![GitHub last commit](https://camo.githubusercontent.com/55af90292b89dfa00e40ddee9c6190b31e8f65cc5b3e16d295b334eaf219613d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f726c776f726b67726f75702f6761726167653f6c6162656c3d6c617374253230757064617465) |
garage |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/9a1c51b9207efeb709d64a010149b4448c84e4fd23b6e09280659db9550f9d37/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b656e677a2f534c4d2d4c6162) |
![GitHub last commit](https://camo.githubusercontent.com/8f71f239616c20cb719998a17e9c66e89ec101efc3f88878910de62e39ecc02c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b656e677a2f534c4d2d4c61623f6c6162656c3d6c617374253230757064617465) |
SLM-Lab |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/10dad2c40eea5b5e4d6a7dae7c8c233ce536d1e449caaf92044b68c8f29e53a8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f636861696e65722f636861696e6572726c) |
![GitHub last commit](https://camo.githubusercontent.com/7a7c0be1e6edb2af5956dd30c644b8b5ee880d177a2f8832ac20b5b7699646c1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f636861696e65722f636861696e6572726c3f6c6162656c3d6c617374253230757064617465) |
chainerrl |
chainer |
![GitHub stars](https://camo.githubusercontent.com/490c549ec5daaaf78fe216b5893563dc7b2b41d92413dcc6e397957cefdf9d42/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652d72657365617263682f62617463682d70706f) |
![GitHub last commit](https://camo.githubusercontent.com/4ecfa4c584f5aa16d4fed2ba04fe2e74843471c5b6ddc95f65b0033f3cf18cbb/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652d72657365617263682f62617463682d70706f3f6c6162656c3d6c617374253230757064617465) |
batch-ppo |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/ebbe41b7ab2678137773ad83c0ccb8debf2bd73c68f719d9e6b0e30fbf8064e8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646565706d696e642f7363616c61626c655f6167656e74) |
![GitHub last commit](https://camo.githubusercontent.com/012b2167b413719b0fed22e04fa451b69c2ca9c83e51d82f8976fc409d8e82f1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646565706d696e642f7363616c61626c655f6167656e743f6c6162656c3d6c617374253230757064617465) |
scalable_agent |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/f3599281e8a9922ce5cc0bb790507353c5c6e013336cd08cbc8b5cbd60886932/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f767778797a6a6e2f636c65616e726c) |
![GitHub last commit](https://camo.githubusercontent.com/51d8dfef70221a9f4b40b6c398fad05b6fd5eebe82d7f980a76bd5008c4827d6/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f767778797a6a6e2f636c65616e726c3f6c6162656c3d6c617374253230757064617465) |
cleanrl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/4ff980ddb18f7adcfc79c26f8ac0167cfa842f28dac0243dff7866889bb01235/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f70666e65742f7066726c) |
![GitHub last commit](https://camo.githubusercontent.com/77bc86f36cbc1a044c324f00b87b3e15d3693ac14dd3d5b07b3983830bf25ef8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f70666e65742f7066726c3f6c6162656c3d6c617374253230757064617465) |
pfrl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/5ef9f143db5d3a10027d42012bcdeb1cc2f2e5389ee54d594296d129863b0e76/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652d72657365617263682f736565645f726c) |
![GitHub last commit](https://camo.githubusercontent.com/f04334512c2a317c1803432981e70c4b47ea70437ffb7a8889da6157d4ad70c2/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652d72657365617263682f736565645f726c3f6c6162656c3d6c617374253230757064617465) |
seed_rl |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/413de27c524c454e60b1802da371d0ef81373139876b10d686b20388f4db46a1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f746f7263686265617374) |
![GitHub last commit](https://camo.githubusercontent.com/6dbc0635ddf4944692f2f02212bfda4d5f5258e3dd8c1cf432dc09cb4678042a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f746f72636862656173743f6c6162656c3d6c617374253230757064617465) |
torchbeast |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/ca8c54c85ab8360bd0750046f7c9962c4c51e9354de87945676893688676b2b4/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f4e566c6162732f47413343) |
![GitHub last commit](https://camo.githubusercontent.com/de220a1581ec42cc627de4080988376438891e27c5096e3da2dcbd731d9ee81a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f4e566c6162732f474133433f6c6162656c3d6c617374253230757064617465) |
GA3C |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/5cefba9fc545cf56f1c5b491fbee7bd20e2dba98149074d11942d088ad68b07b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f74616b7573656e6f2f6433726c7079) |
![GitHub last commit](https://camo.githubusercontent.com/8adc57e72a9d5f6b46d80df62f81788c0a387ad612de638ce10b082dd44daa4c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f74616b7573656e6f2f6433726c70793f6c6162656c3d6c617374253230757064617465) |
d3rlpy |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/92172b8d75bbd1ebdc784f18fb89239d15c9f9353da015746c8fe80d6e990323/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f6d62726c2d6c6962) |
![GitHub last commit](https://camo.githubusercontent.com/c41858418c43bf95eef047f582db1fa3e1385724263a21be37c6b12fe24c2644/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f6d62726c2d6c69623f6c6162656c3d6c617374253230757064617465) |
mbrl-lib |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/69f3f447abf40a9b7ee3e3aa849a2afaeb1f7571864203e873c7df3b617abdfb/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f4d757368726f6f6d524c2f6d757368726f6f6d2d726c) |
![GitHub last commit](https://camo.githubusercontent.com/be79e6a08a9fe48ce35c52a678620e9774cad129c0f2e880244ac759cee11af3/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f4d757368726f6f6d524c2f6d757368726f6f6d2d726c3f6c6162656c3d6c617374253230757064617465) |
mushroom-rl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/481846a3ac1b6dc0a1a6fa9d6206b5c13457f9616f37d37f4eb755cf129e9cca/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f63706e6f74612f6175746f6e6f6d6f75732d6c6561726e696e672d6c696272617279) |
![GitHub last commit](https://camo.githubusercontent.com/a039fdc8adc5836e873431c4bd198ffaa0295443bb321ce7e235efe6235afda7/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f63706e6f74612f6175746f6e6f6d6f75732d6c6561726e696e672d6c6962726172793f6c6162656c3d6c617374253230757064617465) |
autonomous-learning-library |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/cf5398373d38c0223b7b5a076b1dd269d9b112016c8fa5ae509f001eb7b9e1a9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646565706d696e642f726576657262) |
![GitHub last commit](https://camo.githubusercontent.com/e784f86fe5a16066c554441f6a57c4ca60554023ad276f6bd4d904d2267531f7/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646565706d696e642f7265766572623f6c6162656c3d6c617374253230757064617465) |
reverb |
jax, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/8b37e7edd7a526a69627e7eae521b30f70a7664de2913d7572558e22a52c85a7/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6f70656e64696c61622f44492d656e67696e65) |
![GitHub last commit](https://camo.githubusercontent.com/eea7adf77aa1e26be3ad147ac76ef659f1c8c7660cdf60d1e8ba7ee52e3004d0/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6f70656e64696c61622f44492d656e67696e653f6c6162656c3d6c617374253230757064617465) |
DI-engine |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/02903a3e4ca20bb0c1525d67412e4859fd057f0de8840f840eaccf4367bb535e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f56696e462f64656572) |
![GitHub last commit](https://camo.githubusercontent.com/db38e7a905009225ed864c031728f116cd7789c99fe0ca6fe7df5a994ce00cc1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f56696e462f646565723f6c6162656c3d6c617374253230757064617465) |
deer |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/4f6494b14b38687ac0718b970de177d0bb2905925132e22a385d0549afcefb37/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f5375727265616c41492f7375727265616c) |
![GitHub last commit](https://camo.githubusercontent.com/35275d8237b0597883dda4ccec31bbcc894a0ed8cae1bf9e6378d78b8fba94d0/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f5375727265616c41492f7375727265616c3f6c6162656c3d6c617374253230757064617465) |
surreal |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/7f3544d6ef652f817bb4be6239d48bd7dd9a57803cd7190051639d3304c22464/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6d656469706978656c2f726c5f616c676f726974686d73) |
![GitHub last commit](https://camo.githubusercontent.com/5ef3f3b40b044c3d3330ddcc3059a4bd93899bfba343591399f9a2c207f0406e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6d656469706978656c2f726c5f616c676f726974686d733f6c6162656c3d6c617374253230757064617465) |
rl_algorithms |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/3d852f1224f950641f0dd36d16ff84409c71c26066d231dbe5eba1b90146fe7f/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f646f6e676d696e6c656539342f646565705f726c) |
![GitHub last commit](https://camo.githubusercontent.com/0e4f5022c5d1175fd0553df58902e7c630eb4a96e814a0590a79e953d629ccde/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f646f6e676d696e6c656539342f646565705f726c3f6c6162656c3d6c617374253230757064617465) |
deep_rl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/d356129981caa9363b4dce8f3a90f379dbbf938556d90857e2967c5f2a694247/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6c637377696c6c656d732f726c2d737461727465722d66696c6573) |
![GitHub last commit](https://camo.githubusercontent.com/1137b6fcd0ddc56327eea64294c63553b72f11b9c72846671012ffb51c7ac6dd/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6c637377696c6c656d732f726c2d737461727465722d66696c65733f6c6162656c3d6c617374253230757064617465) |
rl-starter-files |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/bd445eba0af30bee12acdef8e21f1b1eaa001c652397090a922a109919f4f596/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f73616c696e61) |
![GitHub last commit](https://camo.githubusercontent.com/1d41555cacce69b8c8ce2ec3c0ffad6d58bcc9127dce4d0f59c9d7899770adf5/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f73616c696e613f6c6162656c3d6c617374253230757064617465) |
salina |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/32bbf8e0bf2d9fb19fc3a24babbe5f6f297b184ee506e774e80e04e1e92d0694/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f53666f724169446c2f67656e726c) |
![GitHub last commit](https://camo.githubusercontent.com/0a7e55e1d176ef8c9aadd0b4db714b875e0529a40d1dae4cca30b390781a2496/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f53666f724169446c2f67656e726c3f6c6162656c3d6c617374253230757064617465) |
genrl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/41a7860c5c01bbe7fcb0daab680c8f7a76e2700d8d661551a933898b9cca75a7/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f537465704e6576657253746f702f524c73) |
![GitHub last commit](https://camo.githubusercontent.com/27a097ba82b71328699f0a36d536d76c5e44d0e38c78db2fe409458931428307/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f537465704e6576657253746f702f524c733f6c6162656c3d6c617374253230757064617465) |
RLs |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/c8fdaf75988bf2f472a3de06a70dd1854cba719f18780f2affe66d79b167bd36/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7a756f78696e67646f6e672f6c61676f6d) |
![GitHub last commit](https://camo.githubusercontent.com/129978abcbe92865ac6f846555e2b86b237d50ed1101511806b69197a5f0c4bd/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7a756f78696e67646f6e672f6c61676f6d3f6c6162656c3d6c617374253230757064617465) |
lagom |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/b4220ff084825d2a0c2335d2b697b94c8e1e98771552a1986c4c039bebbe69f9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f52616661656c31732f446565702d5265696e666f7263656d656e742d4c6561726e696e672d416c676f726974686d73) |
![GitHub last commit](https://camo.githubusercontent.com/a496642afaafc502042ff19648de8c765358a4b8f233708d3ff9f837ab41c3de/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f52616661656c31732f446565702d5265696e666f7263656d656e742d4c6561726e696e672d416c676f726974686d733f6c6162656c3d6c617374253230757064617465) |
Deep-Reinforcement-Learning-Algorithms |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/0aa10fc826022e88b1e27e81d2271950fae31b48f211d8b5fc0f8f6f9e29ed55/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f656c657572656e742f726c2d6167656e7473) |
![GitHub last commit](https://camo.githubusercontent.com/4a09b4a6f7413f79e2857437711f91036846c2a1bbb0c7c9acd190648cd9aaa5/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f656c657572656e742f726c2d6167656e74733f6c6162656c3d6c617374253230757064617465) |
rl-agents |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/2eb5614b5c98befe8a11d2f3c70a4ec37d7ad3070dffd56b64710a268b6d8214/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652d72657365617263682f62617463685f726c) |
![GitHub last commit](https://camo.githubusercontent.com/8d3b747a3279c37f1d576f2ac71043a00a69c5784a9c84561302a2b08d4bd91f/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652d72657365617263682f62617463685f726c3f6c6162656c3d6c617374253230757064617465) |
batch_rl |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/28d2ad2759ce1285f5f2cb3d9b77b8cd6215ed4d154192bcc8c4ed3c9305895d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f666162696f706172646f2f746f6e6963) |
![GitHub last commit](https://camo.githubusercontent.com/d709ae3166064be319afe1b4edc4853048e23b762322698b76d84684f353a554/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f666162696f706172646f2f746f6e69633f6c6162656c3d6c617374253230757064617465) |
tonic |
pytorch, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/763280eff0c44c104ef03d0d5ad2b7c4ec9db036afd3f8efafd37ae4484ad18d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f616c65782d70657472656e6b6f2f73616d706c652d666163746f7279) |
![GitHub last commit](https://camo.githubusercontent.com/a06ae6e26b88ad993eafd3d0ec8b764b3bd15a5d8ba0288d9ac06d48633b13f0/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f616c65782d70657472656e6b6f2f73616d706c652d666163746f72793f6c6162656c3d6c617374253230757064617465) |
sample-factory |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/580f0d304d5f6deff144aa1bf505b836256b4b73e8fb8863a2e80c15da131cee/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f696b6f737472696b6f762f6a6178726c) |
![GitHub last commit](https://camo.githubusercontent.com/aa2c4c02b9d241c096b97fb20a3539d1da7ebb80f1c55c113a7e0ae728ddf5ce/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f696b6f737472696b6f762f6a6178726c3f6c6162656c3d6c617374253230757064617465) |
jaxrl |
jax |
![GitHub stars](https://camo.githubusercontent.com/63f09e87226fd7c80798b38086344590a404e1606e060033578582f7235555f6/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b616b616f656e74657270726973652f4a4f524c4459) |
![GitHub last commit](https://camo.githubusercontent.com/9c20fa31aa7c887951ae1b9e3a4a97afbf2715de50604e5e3bb137462664e435/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b616b616f656e74657270726973652f4a4f524c44593f6c6162656c3d6c617374253230757064617465) |
JORLDY |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/c7a5c5bda269944bc22ef4b5d0e10a3bfb45f62477c67ffbc8f94c6ed4240abe/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f726c67726170682f726c6772617068) |
![GitHub last commit](https://camo.githubusercontent.com/afbe5af03a62831f286ab4fe066255caebcb08f2e53daecada6d0d0954cc0bd2/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f726c67726170682f726c67726170683f6c6162656c3d6c617374253230757064617465) |
rlgraph |
pytorch, tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/12806455cd7b63e67ccd0c5eb9e4a3f968a2f01944e3b3db3279c7993aa1f757/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f69666669582f6d616368696e) |
![GitHub last commit](https://camo.githubusercontent.com/3c953e87d7f3662084253366a4e5c40892ca0b406a3529463b60b5366ebcacbf/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f69666669582f6d616368696e3f6c6162656c3d6c617374253230757064617465) |
machin |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/97e687d3aa98434971c5a492722ae84e147821165c5b4a7ba8b274e896947912/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f736a74752d6d61726c2f6d616c6962) |
![GitHub last commit](https://camo.githubusercontent.com/db6e7eb43a53dedec8de2a87327ae0f91e4e5dafbb40dbf991d6de474a758e36/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f736a74752d6d61726c2f6d616c69623f6c6162656c3d6c617374253230757064617465) |
malib |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/5112a286bb84ad0bbd73b79d7a459a0298bcb0f25513eeb85fdeaa8568350e42/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f726c6d657461) |
![GitHub last commit](https://camo.githubusercontent.com/361bc15aa2d17040a30221e100ac31d59d588097f2ac398f09a8c738950c3086/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f726c6d6574613f6c6162656c3d6c617374253230757064617465) |
rlmeta |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/30e7d327b291c96ab42f944e0f41f236177f22352acd78c276a1b5c51c1e8c0e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f726c73747275637475726573) |
![GitHub last commit](https://camo.githubusercontent.com/ea298eff9abd89acd05230ceed046755e7f3c2523b5534baa676a9d32da29341/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f726c737472756374757265733f6c6162656c3d6c617374253230757064617465) |
rlstructures |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/a420215603ef7aef36d7b43456640a186904e5d6b13344764f110116a4d5ef38/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f524954434849454875616e672f44656570524c5f416c676f726974686d73) |
![GitHub last commit](https://camo.githubusercontent.com/8185d948420328f8da8ae6478f76993f1504f1e24f37d5dca2feee964f307d4c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f524954434849454875616e672f44656570524c5f416c676f726974686d733f6c6162656c3d6c617374253230757064617465) |
DeepRL_Algorithms |
pytorch, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/5362f47198991063d70fe45966967cddbe71efac9380f0dbc3141c83d5e8ed29/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6875617765692d6e6f61682f78696e677469616e) |
![GitHub last commit](https://camo.githubusercontent.com/6fb378ad387b3f5efdc54cc47173f4a35685851b057360645dc97b1e52ac05ed/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6875617765692d6e6f61682f78696e677469616e3f6c6162656c3d6c617374253230757064617465) |
xingtian |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/eeb4be78c11c9311ae7f8ed6de58ba352c3b9d034d6114b2be246080b0671ab1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f44654e412f48616e6479524c) |
![GitHub last commit](https://camo.githubusercontent.com/6203ef5b32ce285b3cb7422a9eb73cd92f154268afcef4b3be45fb329347642c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f44654e412f48616e6479524c3f6c6162656c3d6c617374253230757064617465) |
HandyRL |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/bbfbe46661b86bfe99ca48ea1dfdc85b4ee29e478a7566fc11fa26a8ca36ea8e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f44656e797338382f726c5f67616d6573) |
![GitHub last commit](https://camo.githubusercontent.com/9613dea458b2fec0aed13af261c93ae410a744a8dcd29c3e636efe65bfc31c2e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f44656e797338382f726c5f67616d65733f6c6162656c3d6c617374253230757064617465) |
rl_games |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/b2bf918ab81a199a9f158b8b111685628e2e285c15753ba575a3bc33002a1c71/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f64617669642d6162656c2f73696d706c655f726c) |
![GitHub last commit](https://camo.githubusercontent.com/2332feee31a7e44a6ca10eb9190a885c9779f651bd1167fbd40cf3d62c3fbd07/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f64617669642d6162656c2f73696d706c655f726c3f6c6162656c3d6c617374253230757064617465) |
simple_rl |
numpy |
![GitHub stars](https://camo.githubusercontent.com/1a4effde1c68cb95adbc506c608f9e8f4fdc81b4be4bb50b88985fd23a2525e6/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f537461626c652d426173656c696e65732d5465616d2f737461626c652d626173656c696e6573) |
![GitHub last commit](https://camo.githubusercontent.com/202780e8dcdfd91c5799a205de1b65b3f81518844ac1d7137ecb03480a120f73/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f537461626c652d426173656c696e65732d5465616d2f737461626c652d626173656c696e65733f6c6162656c3d6c617374253230757064617465) |
stable-baselines |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/60900aa2709efc2d89146396f050c8e23caca2bfb2944b5956124a6c88e4faa2/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f726c6c2d72657365617263682f75726c5f62656e63686d61726b) |
![GitHub last commit](https://camo.githubusercontent.com/07371e26e5847bf38d62d8dddaeeddbcc362c726fdfdb774e7c3c33a6dfcaa71/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f726c6c2d72657365617263682f75726c5f62656e63686d61726b3f6c6162656c3d6c617374253230757064617465) |
url_benchmark |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/a9ea2f35f45a2b6b98205e8873a0cff41edc39ff375e7a28535fcf6634640c64/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f416c6672656476632f70616163) |
![GitHub last commit](https://camo.githubusercontent.com/d9ce1562bd440ff9b7cd7cd7d19a244db124f5219d946e5886e16650626a967b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f416c6672656476632f706161633f6c6162656c3d6c617374253230757064617465) |
paac |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/05fc2f2e57dd713732639329acd4a34a192d596450f552f5163258cefafb5789/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f65646265656368696e672f676f646f745f726c5f6167656e7473) |
![GitHub last commit](https://camo.githubusercontent.com/5b9592f715bf41b80bbdf82feb533b3b4dbb3ab4bfb826ad9cf9fddde6beafff/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f65646265656368696e672f676f646f745f726c5f6167656e74733f6c6162656c3d6c617374253230757064617465) |
godot_rl_agents |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/946085d4c290f5719fceb9168f1d5538c1b61e413aa1b69b96e0c8a46feeeb42/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6865726f6e73797374656d732f6164657074524c) |
![GitHub last commit](https://camo.githubusercontent.com/6e7cc9532e445076599ea6de416fc3e2fa58422174a03a975962abac6ac1138d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6865726f6e73797374656d732f6164657074524c3f6c6162656c3d6c617374253230757064617465) |
adeptRL |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/0dfb4b5c97fd918c35160e969a69890bc14897e2a26ba225d2864ab7df7b60f2/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f756265722d72657365617263682f6170652d78) |
![GitHub last commit](https://camo.githubusercontent.com/d435ba4c24c4e5b4978b1949954604df47879e6c387c049b568dba8d954fd2d0/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f756265722d72657365617263682f6170652d783f6c6162656c3d6c617374253230757064617465) |
ape-x |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/fd2156fc4b093acae2a13919804f8d01d03046a4104a215df03ff2af61c4ed40/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f696e6665722d6163746976656c792f70796d6470) |
![GitHub last commit](https://camo.githubusercontent.com/0cf67d7dbc52034a6bf41448315942e028d06539dca4a76f2d843bcf3c107852/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f696e6665722d6163746976656c792f70796d64703f6c6162656c3d6c617374253230757064617465) |
pymdp |
numpy |
![GitHub stars](https://camo.githubusercontent.com/03580f3f5218666a78e5e2bb2fb23e60faf0618cb81a37115da4a7bc239cff29/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f526368616c59616e672f746f726368726c) |
![GitHub last commit](https://camo.githubusercontent.com/1eae3ee4ab642d4f0acf4c2836fb42f6f64fe2dabab49ee9f918450adaa07b94/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f526368616c59616e672f746f726368726c3f6c6162656c3d6c617374253230757064617465) |
torchrl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/1efff49e2c4ac9cf7402d943a25bea7ad27513edd5c3ceb872ab826530330c9a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f6d74726c) |
![GitHub last commit](https://camo.githubusercontent.com/26c6a65b83d8fe85b59f777040104bdf77277568070ccf44de051bbe20424b68/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f6d74726c3f6c6162656c3d6c617374253230757064617465) |
mtrl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/e434239170d00744db2935cf3f2ff54720f7f92f6edc9243211f04e63d2b0d01/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f616c69626162612f456173795265696e666f7263656d656e744c6561726e696e67) |
![GitHub last commit](https://camo.githubusercontent.com/c9074c2825e68796829eab08ae987d8f622373e6c452987a0dd5b6eb323856ab/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f616c69626162612f456173795265696e666f7263656d656e744c6561726e696e673f6c6162656c3d6c617374253230757064617465) |
EasyReinforcementLearning |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/526fe624c1aad9ee56950bae33b9389a5649aa7ed62952bcc7d73e5ba1a02453/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f726c) |
![GitHub last commit](https://camo.githubusercontent.com/c71824a1f158e2fbd5bd109d5a1ec572d43165773440b3bdfd5ca04a6c40ac26/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f726c3f6c6162656c3d6c617374253230757064617465) |
rl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/a7db793fc776be3319684be9615c85d7401f69abb9adfb447fbf96e95ec26e71/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f756f652d6167656e74732f6570796d61726c) |
![GitHub last commit](https://camo.githubusercontent.com/d62607241ecd487876a5190e9919ff6b8ff242bf8618da5ad012f633640dbaa9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f756f652d6167656e74732f6570796d61726c3f6c6162656c3d6c617374253230757064617465) |
epymarl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/daf2a7fa7d68e25e682a5e43e32aaccd6ec7c49cfc9c5b2c905150ef59be8161/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f74656e63656e742d61696c61622f746c65616775655f70726f6a70616765) |
![GitHub last commit](https://camo.githubusercontent.com/810432dc557d6c80d34fdaa1e356022e54ab4815aff4aae61923c967c408c6fc/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f74656e63656e742d61696c61622f746c65616775655f70726f6a706167653f6c6162656c3d6c617374253230757064617465) |
tleague_projpage |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/060c0c581c3a6f991bb377af32f4eaa5d525961466c6d9c5bbbbce7f272805de/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652f64656c756361) |
![GitHub last commit](https://camo.githubusercontent.com/c0b1b84d06bb428b85f2e62c9d5fad1639940ceaf21d04eadbe3421c1004e351/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652f64656c7563613f6c6162656c3d6c617374253230757064617465) |
deluca |
jax |
![GitHub stars](https://camo.githubusercontent.com/0c771843ae28cad8cee7fccfa33c2f2f681691de7c5935bd67e1526c11da966f/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652d72657365617263682f726c6473) |
![GitHub last commit](https://camo.githubusercontent.com/7224b3e5d33bc259d9614ad0f4bbb9532517e27e627645f510accf4d114ad67b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652d72657365617263682f726c64733f6c6162656c3d6c617374253230757064617465) |
rlds |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/ff8fba1fdbec7952cc11657943d79941d8d0325971f762a1bec6b2dba6128b5b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f726c62657272792d70792f726c6265727279) |
![GitHub last commit](https://camo.githubusercontent.com/154d0e4add43792e77f539daeb3e8dd23acddf53f4ae68e23a33f3a757488e22/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f726c62657272792d70792f726c62657272793f6c6162656c3d6c617374253230757064617465) |
rlberry |
jax, pytorch |
![GitHub stars](https://camo.githubusercontent.com/3d9fbea6e07d58ee519d28eb8371d055b787bff3818de16b394b0ffc2a72a7e8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f636f61782d6465762f636f6178) |
![GitHub last commit](https://camo.githubusercontent.com/e6366d8e64d9f86a4999929bb1214342644192f647504697279a0b70e1f4cd4d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f636f61782d6465762f636f61783f6c6162656c3d6c617374253230757064617465) |
coax |
jax |
![GitHub stars](https://camo.githubusercontent.com/dcdb87bdcbeaedb04b3f9ec1ff5609416fee4df8a833464b6653e01f5c15918c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f63796f6f6e313732392f6469737472696275746564524c) |
![GitHub last commit](https://camo.githubusercontent.com/9e291e2428b3ad7a8c609461229a56f14e6ee0c09d3c0182382e2896d962702e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f63796f6f6e313732392f6469737472696275746564524c3f6c6162656c3d6c617374253230757064617465) |
distributedRL |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/a10e9946b66db0f1c1fd927c5f6d8740dd74446618c4e1f6289d628ee50bfa85/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f736368617474792f643470672d7079746f726368) |
![GitHub last commit](https://camo.githubusercontent.com/ef0b823cebdbd3c02f6a99532477467fb799ca7812afd752bef86eeec625d536/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f736368617474792f643470672d7079746f7263683f6c6162656c3d6c617374253230757064617465) |
d4pg-pytorch |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/999d4544ecb65da1644259e6fa8910b0aa3fd9af94e3ae7771b214e14ecddd5c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f72656c61) |
![GitHub last commit](https://camo.githubusercontent.com/682405f3ea00db1b64a1ff994c96c289974e598805cc6a9f159c774af4d0795a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f72656c613f6c6162656c3d6c617374253230757064617465) |
rela |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/db36624cd9cc879c1d86da14c3664bf7d0d47d7a84da99dae7058d10f492ed8b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f657468616e6c756f79632f6d616769) |
![GitHub last commit](https://camo.githubusercontent.com/1bb0cd631b5e49c6ebd99f51346753e54d53bbb3f48f1a41b4c62a57e35953ca/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f657468616e6c756f79632f6d6167693f6c6162656c3d6c617374253230757064617465) |
magi |
jax |
![GitHub stars](https://camo.githubusercontent.com/4149cac66b7a0d737bfa00a2e7506b9ffb7aeaba2d53d51c80422b96afe6b2f1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7370697469732f6d726c) |
![GitHub last commit](https://camo.githubusercontent.com/7e7a8fa9ab1a5b59472f2a67e9975ab330f2b3a67619062dd8efd75f41645bfd/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7370697469732f6d726c3f6c6162656c3d6c617374253230757064617465) |
mrl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/03c2a6575e1ce8b7c30af83e5f2f4896a93d19aa27c2c15dfa5ca3efab5ddabb/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f736f6e792f6e6e61626c612d726c) |
![GitHub last commit](https://camo.githubusercontent.com/e42ecff556d7bdec12007fb77b02a51a6f0209ee06bba1366af3f76b9a8e1f0c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f736f6e792f6e6e61626c612d726c3f6c6162656c3d6c617374253230757064617465) |
nnabla-rl |
nnabla |
![GitHub stars](https://camo.githubusercontent.com/c3f83de5380d6bb571bdb7909291d12203c2b3c9ed132c82f53499e7095a18ad/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f457269636f6e616c646f2f494c5377697373) |
![GitHub last commit](https://camo.githubusercontent.com/63cb8b6cb8c8053cbc742a2ba7603e326b3a30e82b39c5890d388c4aa5d9c482/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f457269636f6e616c646f2f494c53776973733f6c6162656c3d6c617374253230757064617465) |
ILSwiss |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/7badb82697ffab55fa3ac8362b5e83cd1b910d54f25f3d608e827cd6e34782a1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652d72657365617263682f646565705f6f7065) |
![GitHub last commit](https://camo.githubusercontent.com/4c066720718878d893ed099202b991a1f29c03680522c2411f598192aabbfb71/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652d72657365617263682f646565705f6f70653f6c6162656c3d6c617374253230757064617465) |
deep_ope |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/75ff4eb938c7a6a0ef2940dcd634cbd434ad2f9023f063c64a4ef8b52467bd43/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f74776e69323031362f706f6d64702d626173656c696e6573) |
![GitHub last commit](https://camo.githubusercontent.com/afec8f7de5de1109f7145c4d4c98fe9b2ece032d563c6653b676988a6a16462b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f74776e69323031362f706f6d64702d626173656c696e65733f6c6162656c3d6c617374253230757064617465) |
pomdp-baselines |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/9dd99a5fe6adeae1d931fa775adbb0ee7ae7096b29d3b0790d0be2fb5bd16f54/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b75323438322f726c6a6178) |
![GitHub last commit](https://camo.githubusercontent.com/54ca7d50b2911cbfd57497643e7fe67d7a45d8614f1e2305c050571b14e93f96/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b75323438322f726c6a61783f6c6162656c3d6c617374253230757064617465) |
rljax |
jax |
![GitHub stars](https://camo.githubusercontent.com/c3bf8b02735b8ff750732765f81e70a67473880832d37bced5b7dd681aeafc3d/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652f73696d706c652d7265696e666f7263656d656e742d6c6561726e696e67) |
![GitHub last commit](https://camo.githubusercontent.com/ac0877971eb95bf442d9b69a074face13462c79f688ac409a1116ed750098785/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652f73696d706c652d7265696e666f7263656d656e742d6c6561726e696e673f6c6162656c3d6c617374253230757064617465) |
simple-reinforcement-learning |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/d43e2ce7f097cdf06ca84b702cc2fe51886628e10f7bf33ffa3ae167911a4e87/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f68656e72792d7072696f722f6a61782d726c) |
![GitHub last commit](https://camo.githubusercontent.com/c32bce0e6fbdf3d0ea5f90578e3f0f1546cf3f1371d2bf0b158d1d32f1644e1c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f68656e72792d7072696f722f6a61782d726c3f6c6162656c3d6c617374253230757064617465) |
jax-rl |
jax |
![GitHub stars](https://camo.githubusercontent.com/603ebdbba74796556d7886748a5b486e9f40c6406e7a41204469b7210ccf3f36/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f796d642d682f6370707262) |
![GitHub last commit](https://camo.githubusercontent.com/dbb9c790723cdb8e83b0efcee3659242638a1ab64602332e971566cbc5e57624/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f796d642d682f63707072623f6c6162656c3d6c617374253230757064617465) |
cpprb |
|
![GitHub stars](https://camo.githubusercontent.com/b255bae462fd22f929374a98f87c5d6c54e22b43f45606efc63da9d558a912ef/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f686172692d73696b6368692f73616665524c) |
![GitHub last commit](https://camo.githubusercontent.com/461ccc3201b1844acb27ae697af73fa9fd1b76de73505d50439ee58a46f60032/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f686172692d73696b6368692f73616665524c3f6c6162656c3d6c617374253230757064617465) |
safeRL |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/094c998cb44339c6f1cd8617b333702dcd11b05650b3f241304b21875a647f4e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f3078616e67656c6f2f7261796c6162) |
![GitHub last commit](https://camo.githubusercontent.com/b6dac78c53e61313bd2c90644018ac105cb499f240b96419b8075c7252380b1c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f3078616e67656c6f2f7261796c61623f6c6162656c3d6c617374253230757064617465) |
raylab |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/14738a0221334ab4e4539a8304a21af0726f88234350d9749cead14591ab2ac2/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f716c616e332f4578706c6f726572) |
![GitHub last commit](https://camo.githubusercontent.com/701115bab928f9bf48e17850fcde62e34514bf03b3d0c2763cb9832085116fdf/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f716c616e332f4578706c6f7265723f6c6162656c3d6c617374253230757064617465) |
Explorer |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/7e04f476149f9943c943fe359f59acaac48a300e4c75be71c22838990afe871c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f636c766f6c6f7368696e2f434f4253) |
![GitHub last commit](https://camo.githubusercontent.com/b4c21418d1ce309fb211f7f74991354e682d4bd8a0e4167d315fb974c6b83b14/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f636c766f6c6f7368696e2f434f42533f6c6162656c3d6c617374253230757064617465) |
COBS |
pytorch, tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/1541294015fd27cbbfa61afb7dd5866ea2553a1f14bb729745a27d1d84066dd9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6173746f6f6b652f616363656c5f726c) |
![GitHub last commit](https://camo.githubusercontent.com/733f6ca089310712906a9d5de8079b0b0f960d2fbe55543d71593e60a8a94d68/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6173746f6f6b652f616363656c5f726c3f6c6162656c3d6c617374253230757064617465) |
accel_rl |
theano |
![GitHub stars](https://camo.githubusercontent.com/5771022bebc1350dee0929499a24c7edc0cd35063e6c9223356d551d8d7658ca/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f737465706a616d2f59415252) |
![GitHub last commit](https://camo.githubusercontent.com/c16eb27c8a6b7d94308f6e1d15cfd06b7acaca3737528604f62d9bf0a54f79f6/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f737465706a616d2f594152523f6c6162656c3d6c617374253230757064617465) |
YARR |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/21ff1c3c4ef7d219b53e723755f78c93df94cf5f85be70931f6be9af0e7dd48c/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f686172766172642d656467652f517561524c) |
![GitHub last commit](https://camo.githubusercontent.com/61be68966983cc062ffa7cfbca0d2be6116b173bc798e186c052dfa09bca88f4/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f686172766172642d656467652f517561524c3f6c6162656c3d6c617374253230757064617465) |
QuaRL |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/79328843a5296e40af2d4908b84a532d906e5f362358be903845ba9a78149d1a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6f737564726c2f61706578) |
![GitHub last commit](https://camo.githubusercontent.com/b1cd07d76c1141d277aa3990db49e9d2abf0d369b0d3e611411d242615b021f9/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6f737564726c2f617065783f6c6162656c3d6c617374253230757064617465) |
apex |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/f945fe013fd393ef93a4042671bc54286cca84cd6a1b46023b14d66e9cffa0d1/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f686f726f6977612f646565705f7265696e666f7263656d656e745f6c6561726e696e675f67616c6c657279) |
![GitHub last commit](https://camo.githubusercontent.com/22d23d496d4e581269b0110f1aef28c94159a5b86ec33f36fc517c0c13f28cae/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f686f726f6977612f646565705f7265696e666f7263656d656e745f6c6561726e696e675f67616c6c6572793f6c6162656c3d6c617374253230757064617465) |
deep_reinforcement_learning_gallery |
tensorflow-2.x |
![GitHub stars](https://camo.githubusercontent.com/bd3e0baf01b322fee4676f1ab915aad07a984269ffbb82cdcfc13bebbf4b7048/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b6e677779752f5261696e79) |
![GitHub last commit](https://camo.githubusercontent.com/158180781d86d4c569f80c602cb7575e7ffd8f568bb1146f9ae18a7d7122b8f3/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b6e677779752f5261696e793f6c6162656c3d6c617374253230757064617465) |
Rainy |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/891e9407eb41285dfdb23aaab3e6ee767974cd4f6496650ee5f319970007a798/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6c6e732f6461706f) |
![GitHub last commit](https://camo.githubusercontent.com/773627b08fd93f74a072d611c7d3a2e33ea4a3a877b07639e39228dc06ef1ab8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6c6e732f6461706f3f6c6162656c3d6c617374253230757064617465) |
dapo |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/bd3e0baf01b322fee4676f1ab915aad07a984269ffbb82cdcfc13bebbf4b7048/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6b6e677779752f5261696e79) |
![GitHub last commit](https://camo.githubusercontent.com/158180781d86d4c569f80c602cb7575e7ffd8f568bb1146f9ae18a7d7122b8f3/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6b6e677779752f5261696e793f6c6162656c3d6c617374253230757064617465) |
Rainy |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/5c421718c972f5b273d78952d9b69f6d6f871268c5da0fda0eceb0e89694d5f7/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6c6e732f6d656d6f697265) |
![GitHub last commit](https://camo.githubusercontent.com/eca259621ebb177c118385767fb01294c865dce77dabca307d724216bb35a384/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6c6e732f6d656d6f6972653f6c6162656c3d6c617374253230757064617465) |
memoire |
|
![GitHub stars](https://camo.githubusercontent.com/326878c9ee1cae9b580d25308f665e96ea740732a8ff391547f23e47e9631271/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f67616c61) |
![GitHub last commit](https://camo.githubusercontent.com/385b4bf58648db1b77af798bea568ae7a68cba9630fcbd62c25d9db0f67f6ec4/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f67616c613f6c6162656c3d6c617374253230757064617465) |
gala |
tensorflow-1.x |
![GitHub stars](https://camo.githubusercontent.com/a1f6f496aa53e887a4972eb065743e63a20f890602083e3fb36cd96efa6b73df/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f496f754a656e4c69752f4854532d524c) |
![GitHub last commit](https://camo.githubusercontent.com/89a3ebc71d4f687c004dd88e8446dbd95f205bccf6b9ed2beeabf4b17eecfefb/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f496f754a656e4c69752f4854532d524c3f6c6162656c3d6c617374253230757064617465) |
HTS-RL |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/6bf5c4a75b57eedb83779fe6f5f772476b47e88304250dd1fc0441327b94f83b/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7175616e74756d697261636c652f4d415253) |
![GitHub last commit](https://camo.githubusercontent.com/5a6df4c0eb4c2932d4b2faac2f05bde683e4cb8f05124238479a903a5754c536/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7175616e74756d697261636c652f4d4152533f6c6162656c3d6c617374253230757064617465) |
MARS |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/ecfcf9dee7108609b45c5289379d1bdfc57b05a95c688460ecbd174e7efad271/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f696e64796c61622f6e78646f) |
![GitHub last commit](https://camo.githubusercontent.com/0a01cf15d8459bc68d904da18be4f32b7d18521446467d993ab5603972fe9564/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f696e64796c61622f6e78646f3f6c6162656c3d6c617374253230757064617465) |
nxdo |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/1d09061c248390f4a2211cb79faddede93ddf1f02a4082829a5f202531f21cbe/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f52656454616368796f6e2f636f6c7472612d726c) |
![GitHub last commit](https://camo.githubusercontent.com/46ba21fea5760c344e95a1cb3146cb4b32efc83396548c33285966aec1388833/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f52656454616368796f6e2f636f6c7472612d726c3f6c6162656c3d6c617374253230757064617465) |
coltra-rl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/75cfdbc89c0bbda2bbdc401390be787f9e04eb2d0c7fddfdcfba1f7987412088/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f73656d697461626c652f666173742d6d61726c) |
![GitHub last commit](https://camo.githubusercontent.com/ebb7318d8a597a34fde328eb2aed0c6cd69631468540030a6efce852270e5c83/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f73656d697461626c652f666173742d6d61726c3f6c6162656c3d6c617374253230757064617465) |
fast-marl |
pytorch |
![GitHub stars](https://camo.githubusercontent.com/d765c8c031a721e8c14e3b629621ca13bbb4aece7a9b7264c12ce4eb4b0dcf27/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f6370756865617465722f63617573652d6c6966652d69732d612d67616d65) |
![GitHub last commit](https://camo.githubusercontent.com/a94348058aef70b7da5a6540e3dadf3b576207f3e94a7924072175014e85b97e/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f6370756865617465722f63617573652d6c6966652d69732d612d67616d653f6c6162656c3d6c617374253230757064617465) |
cause-life-is-a-game |
pytorch |
RL Accelerated Environment
Star |
Last Update |
Name |
Accelerate Type |
Property |
/ |
/ |
vec_env |
subproc [1] [2] |
all |
![GitHub stars](https://camo.githubusercontent.com/f004ec013822614fab0252755b2822b4115ee36a5d43c2fcb94509c227eae845/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f7361696c2d73672f656e76706f6f6c) |
![GitHub last commit](https://camo.githubusercontent.com/a5e2e234a50e2aeff6a11b026eb57bbfc7dd8e6a9ae310e3eceafcea4d182550/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f7361696c2d73672f656e76706f6f6c3f6c6162656c3d6c617374253230757064617465) |
EnvPool |
cpp |
Atari, MuJoCo, Compilable environment |
![GitHub stars](https://camo.githubusercontent.com/26360edefff6035432212f5162276a7f296f587e786f8021b79eb77e6dfee5dc/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f66616365626f6f6b72657365617263682f454c46) |
![GitHub last commit](https://camo.githubusercontent.com/3c7392aea686db648bc28f21e9193beb0a7b4dcce71ec2d847490a0140757928/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f66616365626f6f6b72657365617263682f454c463f6c6162656c3d6c617374253230757064617465) |
ELF |
cpp |
Game in cpp, MiniRTS |
![GitHub stars](https://camo.githubusercontent.com/075d79489bd9b73b696d48e211b7a4e78029aa4794af5e3dfe058b8bcb6d75fc/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f4e566c6162732f63756c65) |
![GitHub last commit](https://camo.githubusercontent.com/159d7d827ce3b92faf0955ae8b31b4661598cb2610ddd023fb624ededc9758ca/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f4e566c6162732f63756c653f6c6162656c3d6c617374253230757064617465) |
CuLE |
gpu |
Atari |
![GitHub stars](https://camo.githubusercontent.com/e2c14aa2e69b719e50ad08b3c9e62acbecd654135afb9e76e95d3ee4e9017283/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f676f6f676c652f62726178) |
![GitHub last commit](https://camo.githubusercontent.com/25d4628bdfd71d8abd299cadc367ba5925dcd80ec9dbe5db4b8509d96f48f9a8/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f676f6f676c652f627261783f6c6162656c3d6c617374253230757064617465) |
Brax |
gpu |
robot |
![GitHub stars](https://camo.githubusercontent.com/cf1cc664cf161eef3e1b2e160473f6782695c467ce5cadb948564126011bf5a7/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f4e56494449412d4f6d6e6976657273652f497361616347796d456e7673) |
![GitHub last commit](https://camo.githubusercontent.com/8a264892df54d0953c4a058e705a6ecdd8110a03d01b9cc51e49f9c8f5408264/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f4e56494449412d4f6d6e6976657273652f497361616347796d456e76733f6c6162656c3d6c617374253230757064617465) |
Isaac-gym |
gpu |
robot |
![GitHub stars](https://camo.githubusercontent.com/de261d0aaa7d6c2797118069158239ce9528049d63acc2dbf7ef3500f454e496/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f73616c6573666f7263652f776172702d6472697665) |
![GitHub last commit](https://camo.githubusercontent.com/e2cdac2caf5bf82864d0fcab0e24e54c86ea73909747e8e41d5c6bca45342d83/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f73616c6573666f7263652f776172702d64726976653f6c6162656c3d6c617374253230757064617465) |
WarpDrive |
gpu |
multiagent |
![GitHub stars](https://camo.githubusercontent.com/dce24492b23aeeff5799e4a1183720206012eb9fc366c28fef48cda1757f1a9a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f73746172732f42616d34642f47726964646c79) |
![GitHub last commit](https://camo.githubusercontent.com/e1ca01de4a0a5fab316015a39a2cbe2df673e6f878fe6d9c299354c8ce58610a/68747470733a2f2f696d672e736869656c64732e696f2f6769746875622f6c6173742d636f6d6d69742f42616d34642f47726964646c793f6c6162656c3d6c617374253230757064617465) |
griddly |
cpp |
grid-world game |