From 7232b23ebcd04b71fafc5c8b412724113ab77d2d Mon Sep 17 00:00:00 2001 From: Shubham Jha Date: Sun, 11 Nov 2018 01:02:12 +0530 Subject: [PATCH] dix version number --- RLkit.egg-info/PKG-INFO | 38 +++++++++++++++++++++++++++---------- RLkit.egg-info/SOURCES.txt | 7 ++++--- dist/RLkit-0.2.0.tar.gz | Bin 0 -> 6235 bytes setup.py | 3 ++- 4 files changed, 34 insertions(+), 14 deletions(-) create mode 100644 dist/RLkit-0.2.0.tar.gz diff --git a/RLkit.egg-info/PKG-INFO b/RLkit.egg-info/PKG-INFO index f89f0e6..55dc159 100644 --- a/RLkit.egg-info/PKG-INFO +++ b/RLkit.egg-info/PKG-INFO @@ -1,27 +1,45 @@ -Metadata-Version: 1.1 +Metadata-Version: 2.1 Name: RLkit -Version: 0.1 +Version: 0.2.0 Summary: A simple RL library. Home-page: http://github.com/shubhamjha97/RLkit Author: Shubham Jha Author-email: jha1shubham@gmail.com License: MIT -Description: # A simple agent trained to play LunarLander using Policy Gradients +Description: # RLkit: A simple Reinforcement Learning library This project is still a work in progress. More algorithms and detailed documentation coming soon :) - To run the code- - ``` - python3 main.py - ``` + Currently supported agents- + + 1. Random agent + 2. REINFORCE (Policy Gradients) + 3. DQN + 4. DQN with baseline + 5. Actor-Critic + + See examples for details on how to use the library. Requirements- ``` - gym==0.10.5 - matplotlib==2.2.3 - tensorflow==1.6.0 + tensorflow==1.11.0 + gym==0.10.8 + numpy==1.15.4 ``` + + ## New in v0.2 + - Added DQN and DQN with baseline agents + - Added ActorCritic agent + - Added support for various activation functions + + + ## Upcoming + - Duelling DQN + - Support for logging and plotting + - Support for adding seeds + - Support for custom environments Platform: UNKNOWN Classifier: Intended Audience :: Science/Research Classifier: Natural Language :: English Classifier: Programming Language :: Python :: 3.6 +Description-Content-Type: text/markdown diff --git a/RLkit.egg-info/SOURCES.txt b/RLkit.egg-info/SOURCES.txt index d0d0b40..78fcfa4 100644 --- a/RLkit.egg-info/SOURCES.txt +++ b/RLkit.egg-info/SOURCES.txt @@ -11,7 +11,8 @@ RLkit.egg-info/top_level.txt RLkit/algorithms/__init__.py RLkit/algorithms/agent.py RLkit/algorithms/dqn.py -RLkit/algorithms/gpi.py -RLkit/algorithms/policy_gradients.py RLkit/algorithms/random_agent.py -RLkit/algorithms/utils.py \ No newline at end of file +RLkit/algorithms/utils.py +RLkit/algorithms/policy_gradients/ActorCritic.py +RLkit/algorithms/policy_gradients/REINFORCE.py +RLkit/algorithms/policy_gradients/__init__.py \ No newline at end of file diff --git a/dist/RLkit-0.2.0.tar.gz b/dist/RLkit-0.2.0.tar.gz new file mode 100644 index 0000000000000000000000000000000000000000..70d762734e2598b3a673b3a25611cd0f569d00a9 GIT binary patch literal 6235 zcmV-h7^LSPiwFqRG3Q$X|72-%bT3j&YiV>XFfKAKFfMdqascf;Yje}cvV6r=`VUj# zgYCt3EWdKrb$#mQ0L$er1QytHKIEi?Vow|`vLy6?WViV5r+eOd*s&oo>>f>}VriZ| z)7{fO-7V?$^Y>ob?e_+~{^7klN_|L2M`Qf8kH&rTSEhURaCl@-hW(?#=w9C*PDYb^ zWPEQADN9l}CgfgnnVny{tF`rRDwh+HzkibS+Q9#-pPzQ0o&5CjF7Q8@jMm|QFghyY ze{_WS@7MUh^YntI?!ryo?muaqcwsOlgPz?uaaVLo7;Q9E0V9&en{2gm2G>xW*hf6PomFvyJ)uC9z-!9!Bj}Cd~$60zA##8c! z7m@$JbVXj5u3XQb5~yv9hX1?7EbOZB+?&%Nfl*#Od)s(SlX>h#DTDF>2it^?dcj2) z&*_Q=DS1xaIPij{gxP8kk@VHuOD`c&9R5b%a|rfkGu$D zN?d;##xTuQLfl|M7O&dkP!eIhfPAbp0=xoeU!y9RQIn*l0{J%r_cv1 zWsoM_s_J%+yoT|@6|bZV22k(>8Ts|2C#3Z%^u75tc^bP55BoBP9`?xNUrzM>h~1M< zFc)&}Ce-%=s!PW`ay(A~Gml`h-nIm@1lC-vMM7ZCm*FRph9pZUNiV4) znW}DH(+`;!Gklp-fA{X4zDWW9VSM3-pJp?=XWPBLE?Zu&X0v|J?)UztGlOguU9-C5 z-e^sy`s%?0azZ~LvOfad>-;V`UMv7FxK4=d(s~Jum0Pg2<4adWn5-hu&Q|WD8+%~} z6g5x1kDP)ovS5xENfp33(0`3MwV6Xa&ZzGr1?EuRC2x#D{cyR&Dmb&q57V^JhgsKM zEEqjgx=7a5nZxc1^htw{UK|DtpN&_(n?l)YN`5{0`Q+ulP8yGVH%Yt;kHSXqEC9r^ z<;sv;=afugcbK!w!`Czc?ww!eTAa9P7P~%q?gq;Y78V;k36{Q>@+F8N)KV{d%p-j1&w=ukz~q$cHN`PWfwQh!*8hn zO@@BcjXh9?7^+8>L%_5 zZEP@5H8vey#RRmRu9%%s$ad$-lEsIhGCyW=*je8&0}UdnEQy$Sc9v2+9~yFEy9P?u zZ&%%z`ey#GLeCwY|Lp?*4@SfK{J)n}AN}j|{~G=`x8A$8|4aVwkA{<@0m}bLZU3wJ zzfSw*f2jf9_845pKU&BC_OL%v@_&MUVtYJ1>eu|gk8}~k`J5p>4MRU6-ijUGSx$#s zc)`Mn-1&RZY~he^@k2r@a94EJWTeyV$g}@PZYP{I88PYng+5WwnpH+aT{VmSS#uk^ zp>E~*xs|b|*&)phHX1D6$~4o|aDZ0gpjI;b$@LT3u6OZU z)c@`v3ViqYpV8!KSjYc-8~o?ZJbRG;{i6}n|3UPRk48fq{eM6Swfx^l67n8|2#R;M z!Nbn1C}0Y*V?i&7G#a%M>R)uwpzoj(&>=AjfLLtASo=QK=s^XL5YTIH<-VsaS--6+ z@ODs#U#R@lThSz?5tQ^*<{}IzWUxVu9zYpswGnIvBEQEX4o7&N&{%j*W<)}zo87-3 zgEA8b#Hgq`LlDGVUFLJ)eR>zffSzUDH+sfQ-nG#uuF)qqUUUdfqeJj)Z34uG5`$Dj zRn>!nbnb@)m z?0@!PJQ)c5_Xnd1+W*G(i z6qpEwV|WtLdD0v^v)4pnN8{8Jr9a{@O2jz? z#P5uaA#-JI%oo?P$N+*ssc|c7n2=!=^Ip~wz+wOVQWo$zFo4*lF)SJZ5;#s%>{J2I zgtS>ITfiyZ;rWSbVAksevL=vjN}a^}y`pDBe-O=*OE;pY{WIBm6@G*Rx5IS{>;RF` zkfn~hSU8an4KG6<^qQpAh9dZTfWazc6)vc+Rz++S7hd4{j_+QBW+wq+{jl1tCR=mB zsR6t(LXJ+_vg?nopV55JRb6vjZRp!XW;?%tY>0&8E(H|hC`oUD)}U533>{*3$a@+G z)MxbWxjrBPX%^a}y(jk0Wj|N$M~}v4wN|@hg!Kp>;5IcApr%-GlK_C`ymS+&WlV@A zF{tWpK+i$gY!?8JVjxHbcM$ZF@FHEgSFQ5wV1z3#nc0PoSr58jsO$LNd+K|aVYnc2 zLBeGV=iz&ibAHVivQ>hk1A7UVJsq~IV3MO@(`H-V6u;cKaGNGm?2HZbK!=LPke}q`h%d?^zO3MQa^-<%pGUX~0*kQ-+zA?mx*^x$Y}CyhGNJSzB%xaBcxbCM643&1!uj>EWBNn%y=F_)aPexAYkin0=inKk&x zuy9_`J6^b}msrGh);s}dxnCrj?vkbwFhrmW(Fo z3My`Pkjur)8&R(1Fb^sRhPH3m#t6NQ{T3J;WRQ zv@~0uXBQWsV{ix|^V20DlLTSPj9qMC*4@LI&93QHL}Tu3nvp*~vpl{jkesgE0`S^} z7NZ;r4rFfQZC!g=Aok+-3uT(!Z&{+#&3TDwrOU zmfbb0wV~e5V3bK*E=+ky)*y<#AZ;By;S@dnmW`qWGHg0syZyPXM&$}SRObP%z4>M6&1uW`lC;IQh@uXM zk~f-}0Kti~tTC$>VK2J17|Q&YN%Zl`b6E%aN`u;sRuD0)F{3zRM3X)T9- z$j=#jT6myxWz5`{vFN>{!mnmPH zV#a5s1ya~98S)}GN&d|CfAdj;+w%Y0gOPgvr#~3?hxht}(XemV_Wy5c|F^0g06I!Q z(SmdUSQ|V5AmZ`iS?L4d2324S4-_nE^8Es5fK}}cur{~@R9OxrrXQFYs#=y%M?Kql z-v~kgmAi5psCDDzLT zYokMg1v;#CNnn{(a7tJ^dL=|PK>r5!L5?`uW-N$_p%T7t8oPk~4FFWqNn4LsaAkaF zo(zenDqqI;?#ZyKT^V2N$gtLUGWO!fC~_6|WLQ9g#&Y5BD(VJo2wL8Pwvp+*q zLEip(DO=obi@AP`{V$fa#&@D<+3;WN=DyhIw_py7Ed;n8-BH-w5so#?ScIsG zSP(*MgHy%Y;8n49aI09i>sN`Em3|eg+OcANfoDb0%?96!;Z-rWGnILxXT_>?t?0cP zyYiX3T{c9|PR~r~TJW{-q8q#|R?*#JZSc2Pro+Wr?{TpzT`pFI&&4vGF8oHA82|We zZFacm+S)kF92sVTawi;q0!&E(dut)Z}#UC{$j(wwWa0X+GzT>Zm|7xARPxt z1pf)cKl?Ftn<~?P$+%yo7l|Tf@h59_n%(UF)~y=;^R|3t#9yPKO-)YvZ0H=^l5c&N zru;qF|MTw-x}ErcxakY~|M&|+e|FqBNfAt$Ch?|h~Lc95xbFbvv<1!FV;0cA( zQu++v>4DD+)5R0CWfczTTi4d&_2$Zk8$~GoXn}ON6_e#NhhdbZIU6qbDis_$%>1v< z4BRJ>I4hSOdNI3+)*&};PFZV~6H`BHPPr2RuX%3bEmxtpkOktFm!)oSDGTr#Guern zdnwd`TpCuT4MZ4M^#p}J$P~vbP~@0@DW^T={Z-=V2?t(Q^|Xn`-{#qD)?^NsrYOe> z-qmc@m-ienQuffWbwz+n3)~@D;ISex6e{b@Gt=23&i%$JpNhIVyLooj&HtwfyI=JH6xgf7s*UNId^L9`r|J_Wr*?zn1@d)c>o(f7WUSyh$-ENL)pWbCl3h zdwBfI$rpqN39APSBte5bB*=8r`K8Jm{Hq-!S-U8z!?J;dD9 z&3Jq4ARl%loSL9kfUM-g^Z|MM^6|@-po;dC#h--igw=&1h%oMScvNvM^BMZRE^Kw-f3a_+ z^q84mu%K5&1_0%UszPdYeACY1OHGFL(8HMa}GQe)&*ree@j9+dSFPh~o7SHZi*V8z+(IOZmmJU5rN;XeK# zW3kqRHx)qNS8UUVTu7Fn8u!Y{gIkUSP!Uca)Z+yC;3l(^rttXNXJ&vJ_30dK=r;{j z8FZkBU1#uBkwV3Bn#Di_0oEpz7AeNWtSGw)!PO-CE%7WM+6mo-$?lAG85I9j$S(nL zOEi$*)Wj%U%*cVW_Fe+z?kY^KDvE7yL2O?Z!N$>$kgt85Ke@f=HKj&@R0P$G#?6Yb zt5Ue84)$Vg^!Rd$Do&bS+lJJv&^x}EXnkA0}!DU zhLNMFo2!%J8%kK8^#RvtA^Y8nSdbCq%tIen03!z==P3p%{Y`RDQL zXUG3|{^X6YEY1qDo`uYPaX%#iV@jCfq*UmNno18}#Jdbyc*)U^;UK7FKP0V|O}cEE zAj_!GHiD#q0vn&x{1w2z<|xI+Gi6po({m3S=YMm!Vu_k$| zfNWcg@DltXP0Ce7&4#EX`us?FD}fwv1Gn6-vNE*3GEh+Ce5)uxe1>CP^dIgmP-ga6 z6`psX_N)#$;9+_PGXCy>H)a_Xp?C*=EK4vx=72@>9jpn_TNe^j3{Vs6s09q}N+3IA z;8;=AP0a(N*ucZ6ZM>MbK)_C1ExqR51%YjNWYZJGSC`q$08DGe4B5ny?Rj zt_x^HO;Q-Zj6+{V4CaSjUVgA+{3TEy9%bbaJI7Q?i?ERDY{CnNuQ2j=ZXwLo?~s*L zYV@wzDbps8b*+BOL^(<`H$I=r?r*86=w$m~&qCvha7eCHIM7S6J0X;I>1@8wlk+5^aDicTX1sxi|M8Cx&_tp-OEYPL0 zy0q-BL?ZAp8?-GWNH@JFq7*E;d)Vie@tk5h)BKsX80CqJR{MCr*#9fPT6wqeUwwN# zmfwFHusG2{e>|zAHf4J!@*>@@b2lD$LW8nV582I0|$MyGL_Za_WZuIKu4!tMHn6Jf$ zK$brK<-}?{AUwbLoKWcj5!pdG&a9Te-y8qm64UR(|6~3Am&x#megDZG)cn84_)oRx zZ@U#3EsDEBslxW#gKksr6#M6Y{{83q#qyTNxbge%qewxRuZ$bb1!>pS58P2YbXjOF+L29y4XegEAa*6)AaOL{;U z1x$(lGCRfXAfB^_F7-EX#Mj#Ky#4mlOGp%lztMS${?a7%e4n@kgQn5b65;2((J??? zgfS&rsuR#7$bzP>=To={=NXQ{pEjF^?DOAAh#&lBo}Wiq97C~xO_D4^JpkG;wIJzY zvE37T3D2||gPztXNb40-I>=M0bU>HG9#>FC?3b_rK>6Y?t1<5JXWqN~p?4hO4W)!$ zF#|!u+*Ta+gaC|};U|31BTFbrFRA*NJvMvIzu~?TpuT(e&T5oD;chjIFSlEb+_%|9 zBRF9_ASd(_F6u|%QLE9#Cq`f$5Pn?D(mccp>6+%F{bHeHkyutDLglHcDST+Zy1iTtw zqOMKHb*fXH>QtvX)u~Q(s#BfnRHr)CsZMpOQ=RHmr#jWCPIanNo$7Q$`VVr>gdqUP F006G$gx literal 0 HcmV?d00001 diff --git a/setup.py b/setup.py index ff684cc..550cf7c 100755 --- a/setup.py +++ b/setup.py @@ -1,13 +1,14 @@ from setuptools import setup, find_packages setup(name='RLkit', - version='0.2', + version='0.2.0', description='A simple RL library.', url='http://github.com/shubhamjha97/RLkit', author='Shubham Jha', author_email='jha1shubham@gmail.com', license='MIT', long_description=open('README.md').read(), + long_description_content_type="text/markdown", install_requires=[ 'tensorflow==1.11.0', 'gym==0.10.8',