From eebe6ea753199a68a0aaafbb35a406736e7a9cd2 Mon Sep 17 00:00:00 2001 From: Jin Wenyao <wen-yao.jin@student.ecp.fr> Date: Fri, 24 Mar 2017 01:58:17 +0100 Subject: [PATCH] go --- __pycache__/agent_afterstate.cpython-35.pyc | Bin 9015 -> 8999 bytes __pycache__/logic.cpython-35.pyc | Bin 3681 -> 3681 bytes agent_afterstate.py | 10 +++++----- 3 files changed, 5 insertions(+), 5 deletions(-) diff --git a/__pycache__/agent_afterstate.cpython-35.pyc b/__pycache__/agent_afterstate.cpython-35.pyc index c98f07408ce6dd5b46f6601976789ee53da6ad7a..072919ca89ffc8dd8cc1e54a537e19784fcef4e9 100644 GIT binary patch delta 1530 zcmdn)w%m<VjF*?|c;1zWmm4{cGIDV+FfceUFfbG|PrkvZUf;sT5XH=p!pV@r#n8gQ z5XHif!p)Gv17@=_r0_DN@PXNE3@Q8!DFR?NJ41>fLy8cX&B2f&%#b1iW^*#6h%%&z zf!SOPDdG$%5)3Jl3@wZdQQQnEQVc25U@0Dk6d8sTSunevmmx)tAw?d{;bTZqU`SB} zv-!dLl^9Z#8B$ajT9_E31Q=3O8B)~1vVsgL>I^9wV73rLiY7yf7MLx}kfP0yq621& zfJ_M1)V;-@m{yWnR9uo+lIobAnpcv}00rsQB9oZeCkrr(aDqYwB+4;ampOoog`tCi zA)be!hGlX)vn&@Im@B|g!#;T(vn(U~<TK1VjI5J?GMh27PBvf(7hz>6ieW4f1u4st zW@u()V60)?Jewt&NtB~VhJk_M7ISW5Ns%f814EG#0|UcmA@(|UMw`hK`5tpSf&?u< zg!$xpeqBx{kaEV9BCE+;`QI=)O<p9BCgcf{7Gz*x&}0G|SLC@_N>GN8(Q>l6&|F5# z$ybHkc)gINCu;~_WAvW<Usy~7tQTx3OLBg0(k;fKA}g42MIbYagg{)6$+jZmjLe%u zMfe#R8z!fUx(a)PT*8)El%AVdQRD+sWIlPXsIy=Q0|P@XC;@@PjFE?FvY^=OdPat3 zCWcxTh8h-z6lMl<2&;yTp@yBorf?BMcnSkUuqKNia@enPe^}LG4;A@fugO`Y2C@Z| zIEz3ba*H*yBsI7A7IQ&<L6Hqe$`?fVf!xKMo?4;_3EU!g1_lPEBCE-D;^vGko41Jz zGV+E(LPH#+K5X(83020~lYdEA)r0(06b=%FcnHK21re+uLpe)Qi%a73QY%V|{6Pk= zLP9$Uq#zQcfD4h5ih@C+pa9flDgvtjMKm}tZ?VUhBo?Komdpf&5*sL4F<CK6Fjk3A z-YmI*k!5m-)H6v-n0BN{kYr$BSUx#e+J@17@&su~c~6j<WDo&%H`vMGAkYJec}+ec zt*B-XVuHiX0OVw7kbqoU1lA6Ut)i64{4%0gtpo+s{K>X5v*Zw3K%PQ!703ZwHh+~_ z##o;SvJ8}hi&8->gj>LIrVkPm0}&wS-eM^(EGj872Jv-3fyZ22Qd9&EY+H~^IT3+- zi>)ZNJh3RHC<UaB4H9@o5+I%NAQ8sAB54q3vXs0$<Mz!~@)?ZQ>9b~nz)t%jPLOHb zMRp(+Ah#ApfLLJ9tAkkPAR{<SiW2jR3-XIoi}EMmRFGB42I*o)xS=Qqq>Ql`60dn6 zjh2(86r~uCPc~I-5(gUx%40>K<Ok1(lg}xNGv1l}Owl^b45UQ^L}-BsZ4hAsBETtE z7sLYV2c@hc4-gj|HQ*oxhbAa0iohPo2g#Oz2&2i2%Hoszlmx`&<ak7Q*m&4@IC$82 lxOkZPIe7SZ*e7pM(iQ}VHfLr@YEemkeok?b%j6GA?f}zFHdp`v delta 1498 zcmZ4Pw%v_WjF*>dvh<aR+>M+^8M!za7#JKF7#ND#Cf{IGuTSA*XkllFVrEF;Vo2d; zXklQ8Vqr+(VMyTxvsoEZ_!v_7!E82$6aj`5K`@)0Aw`HGMHtNHU`P>RND&3IIT=#K z7*fQ+Y%Ycr35FC&h7>7=7Dk3BZiW<Th7=jF6c0m+EJKPMLrW?HLliGViabM#0$75N zAw`iPMG4I22kTd6NKs)(QDtahVu%u8NKs=*Q3uNkGNfoQq-cWKLJTQd3@O@RwlG7A z4nvAAm@NV_Ay`vy@&hInwKOnzXP;gzvd;ZsRf~N{5gP*oLlHXz14A+>R2Uc-7&s>@ zG6!(6GITI7#PcxJuuiUKmepVfa|IY`I2clx7_yldih4mJS%M7B3?N3l5JR3WLk-8| z1I#*%Y?I$In=!IYR$&PjVPhzYVJr~^smYRNXl7(!tYO>S&l1ff!&xN5z`$^eIXAJS zNEPG?B@mZ2Jux>oar1w+I(A0e$#r~>xt&0AmLS4nat^;Pk26RaV@i=V0|Ub(d6CIG z`L8lMPwp2;6Y>Hn5@cXt&}0IeUF5ZyT~LOR(Q5KVF5$`MLS0bSRUu<uZ)9bYMTM_v z`+&@4$;nSQD$)c=vO&!N849+OB{@Gg=@w&Aku}IXNlyj_hI~*e;sJ#kBO9YIqX?rq zlOW?}ClP)|#@fk2qOQVVL)j9G(sL6lihMyvSxjCf>MR(_z`#%q(#!$Y%)>bOpXlp) zW`<@ahFTVe8Wx5W76x+&tA>rChMmEta1ldz3Ijv1CaYgMNDm0Z<FSYlWHcx)H93pa zKx{`40SdKSteGXLxy84b3-Sw!Y(b)aAi^KyTjuoC5={<>KRp;2m>G(!CufP9Gd6Bs zBreFv8wLsnrXq2W`tZpIBvct^OnxR|B>?hNQ3Oa7>LUY5Nw)xyVpfP*$soBXkPTdk zX(g#e#U+U)sYM|mQE2plRe<8ZNC>2iJ-#HdC_S}g+T?!84U9~a9i*N?;)+$0fq`Mk zWP52FMu*8Y(vtGvI8FhX1a<}30bmd5fyBHgZ;@8C0p)E-C>Veo1@$1vJw;&cpujIm z1=-7zlAo6v#aWP%8J}2Glvr5=PAaS*kI$K`DKm==q6rk=tRPD_Zhk1Uj8QWQWEUv8 z7Nvn$2>ZdIt`8Cu0}(!xH^|B9*nu1YN$o`-f8Sy&N-a+;N`W|m4dU}636O?_$-m^Z z8Mka!lh0r@heRqUTWWF_*@L7(PAG~5vB3UN2eB+b{@^SrO3W)R$S+PUDwupyK~^OP zWG6dPY~+HJF&0B20hDZutR{0QN--Xptg6@~4mJ*yC5k}l0-k-q{x)J@V7NK?nxb`> zImkW@5TOMkv_XUkhyW)mT@VXw1}G^MfwD&tIHbX$1r8`sxE6suQ2<h03L=aqe^e5m zT&E-;rYOfF!o$YH#>2tG#>2(K%+JBY!^1XtiITP;D6VgDW|pKDmE`B=6c@QpexT$I E0F`?-lK=n! diff --git a/__pycache__/logic.cpython-35.pyc b/__pycache__/logic.cpython-35.pyc index b6f2e6f8362795f1630ed908724d5b72ef96b480..dd61672a13e9ee6b4c277e0eb230bfb7d2b4d481 100644 GIT binary patch delta 198 zcmaDT^H7FejF*=y%lpbk_QRZvw<e$FjAc<~U|^VdQEc)bo<?pd1_p*AIS`>d`5c!A zi#k-!fP0QONL`T%0|SF5bCD`Yi42HPoBWvDX!0W-smc00c{tT<;n8E!gqrn-ryHlb fdA!DqT9YsFT8M&e16g0B0kQ_9xkziWJf9N)Pc$l+ delta 202 zcmaDT^H7FejF*>-@6`E??1woSqb8r`jAc<`U|^VdQEc)bo<?pd1_p*AIS`>V`5c!A ziyBnUfP0QONL`UK0|SF5bCC*2i42HPo&1>Fh(#T$PM;?ar@AdXdMp}Hb$@ueajKig eYs{!Q`4X>%DA-1j6N*6Q7lAYvX-<~sa{>TeGAbwl diff --git a/agent_afterstate.py b/agent_afterstate.py index 49533e2..312991a 100644 --- a/agent_afterstate.py +++ b/agent_afterstate.py @@ -11,7 +11,7 @@ class Action(IntEnum): RIGHT = 4 class afterstateAgent: - def __init__(self, mat, TD_lambda = 0.0, alpha = 0.0025, gamma = 0.95, epsilon = 0.01, verbose= True, symmetric=1, tuple = 2): + def __init__(self, mat, TD_lambda = 0.0, alpha = 0.0025, epsilon = 0.01, verbose= True, symmetric=1, tuple = 2): self.state_per_tile = 12 self.commands = { Action.UP: up, Action.DOWN: down, Action.LEFT: left, Action.RIGHT: right} self.alpha = alpha @@ -143,8 +143,8 @@ class afterstateAgent: else: self._reset_trace() for tr, ind in zip(self.trace, self.index): - v = tr.get(ind,0) - v += 1 + v = tr.get(ind,0.0) + v += 1.0 tr[ind] = v # print(self.trace[0]) # print(np.sum(self.trace,axis=1)) @@ -164,7 +164,7 @@ class afterstateAgent: return -1 if done== 1: done = 0 #1 means no reward - phi_array = np.array([w[i] for w,i in zip(self.W, self._index(state))]) + phi_array = np.array([w[i] for w,i in zip(self.W, self._index(afterstate))]) if act: # in the act phase, explore when there is 0 if 0 in phi_array: @@ -203,7 +203,7 @@ class afterstateAgent: return s,r = self.test_next(self._action_index,self.state) n = next_state - if self.symmetric>0: + if self.symmetric>0.1: for i in range(4): s = transpose(s) n = transpose(n) -- GitLab