From eebe6ea753199a68a0aaafbb35a406736e7a9cd2 Mon Sep 17 00:00:00 2001
From: Jin Wenyao <wen-yao.jin@student.ecp.fr>
Date: Fri, 24 Mar 2017 01:58:17 +0100
Subject: [PATCH] go

---
 __pycache__/agent_afterstate.cpython-35.pyc | Bin 9015 -> 8999 bytes
 __pycache__/logic.cpython-35.pyc            | Bin 3681 -> 3681 bytes
 agent_afterstate.py                         |  10 +++++-----
 3 files changed, 5 insertions(+), 5 deletions(-)

diff --git a/__pycache__/agent_afterstate.cpython-35.pyc b/__pycache__/agent_afterstate.cpython-35.pyc
index c98f07408ce6dd5b46f6601976789ee53da6ad7a..072919ca89ffc8dd8cc1e54a537e19784fcef4e9 100644
GIT binary patch
delta 1530
zcmdn)w%m<VjF*?|c;1zWmm4{cGIDV+FfceUFfbG|PrkvZUf;sT5XH=p!pV@r#n8gQ
z5XHif!p)Gv17@=_r0_DN@PXNE3@Q8!DFR?NJ41>fLy8cX&B2f&%#b1iW^*#6h%%&z
zf!SOPDdG$%5)3Jl3@wZdQQQnEQVc25U@0Dk6d8sTSunevmmx)tAw?d{;bTZqU`SB}
zv-!dLl^9Z#8B$ajT9_E31Q=3O8B)~1vVsgL>I^9wV73rLiY7yf7MLx}kfP0yq621&
zfJ_M1)V;-@m{yWnR9uo+lIobAnpcv}00rsQB9oZeCkrr(aDqYwB+4;ampOoog`tCi
zA)be!hGlX)vn&@Im@B|g!#;T(vn(U~<TK1VjI5J?GMh27PBvf(7hz>6ieW4f1u4st
zW@u()V60)?Jewt&NtB~VhJk_M7ISW5Ns%f814EG#0|UcmA@(|UMw`hK`5tpSf&?u<
zg!$xpeqBx{kaEV9BCE+;`QI=)O<p9BCgcf{7Gz*x&}0G|SLC@_N>GN8(Q>l6&|F5#
z$ybHkc)gINCu;~_WAvW<Usy~7tQTx3OLBg0(k;fKA}g42MIbYagg{)6$+jZmjLe%u
zMfe#R8z!fUx(a)PT*8)El%AVdQRD+sWIlPXsIy=Q0|P@XC;@@PjFE?FvY^=OdPat3
zCWcxTh8h-z6lMl<2&;yTp@yBorf?BMcnSkUuqKNia@enPe^}LG4;A@fugO`Y2C@Z|
zIEz3ba*H*yBsI7A7IQ&<L6Hqe$`?fVf!xKMo?4;_3EU!g1_lPEBCE-D;^vGko41Jz
zGV+E(LPH#+K5X(83020~lYdEA)r0(06b=%FcnHK21re+uLpe)Qi%a73QY%V|{6Pk=
zLP9$Uq#zQcfD4h5ih@C+pa9flDgvtjMKm}tZ?VUhBo?Komdpf&5*sL4F<CK6Fjk3A
z-YmI*k!5m-)H6v-n0BN{kYr$BSUx#e+J@17@&su~c~6j<WDo&%H`vMGAkYJec}+ec
zt*B-XVuHiX0OVw7kbqoU1lA6Ut)i64{4%0gtpo+s{K>X5v*Zw3K%PQ!703ZwHh+~_
z##o;SvJ8}hi&8->gj>LIrVkPm0}&wS-eM^(EGj872Jv-3fyZ22Qd9&EY+H~^IT3+-
zi>)ZNJh3RHC<UaB4H9@o5+I%NAQ8sAB54q3vXs0$<Mz!~@)?ZQ>9b~nz)t%jPLOHb
zMRp(+Ah#ApfLLJ9tAkkPAR{<SiW2jR3-XIoi}EMmRFGB42I*o)xS=Qqq>Ql`60dn6
zjh2(86r~uCPc~I-5(gUx%40>K<Ok1(lg}xNGv1l}Owl^b45UQ^L}-BsZ4hAsBETtE
z7sLYV2c@hc4-gj|HQ*oxhbAa0iohPo2g#Oz2&2i2%Hoszlmx`&<ak7Q*m&4@IC$82
lxOkZPIe7SZ*e7pM(iQ}VHfLr@YEemkeok?b%j6GA?f}zFHdp`v

delta 1498
zcmZ4Pw%v_WjF*>dvh<aR+>M+^8M!za7#JKF7#ND#Cf{IGuTSA*XkllFVrEF;Vo2d;
zXklQ8Vqr+(VMyTxvsoEZ_!v_7!E82$6aj`5K`@)0Aw`HGMHtNHU`P>RND&3IIT=#K
z7*fQ+Y%Ycr35FC&h7>7=7Dk3BZiW<Th7=jF6c0m+EJKPMLrW?HLliGViabM#0$75N
zAw`iPMG4I22kTd6NKs)(QDtahVu%u8NKs=*Q3uNkGNfoQq-cWKLJTQd3@O@RwlG7A
z4nvAAm@NV_Ay`vy@&hInwKOnzXP;gzvd;ZsRf~N{5gP*oLlHXz14A+>R2Uc-7&s>@
zG6!(6GITI7#PcxJuuiUKmepVfa|IY`I2clx7_yldih4mJS%M7B3?N3l5JR3WLk-8|
z1I#*%Y?I$In=!IYR$&PjVPhzYVJr~^smYRNXl7(!tYO>S&l1ff!&xN5z`$^eIXAJS
zNEPG?B@mZ2Jux>oar1w+I(A0e$#r~>xt&0AmLS4nat^;Pk26RaV@i=V0|Ub(d6CIG
z`L8lMPwp2;6Y>Hn5@cXt&}0IeUF5ZyT~LOR(Q5KVF5$`MLS0bSRUu<uZ)9bYMTM_v
z`+&@4$;nSQD$)c=vO&!N849+OB{@Gg=@w&Aku}IXNlyj_hI~*e;sJ#kBO9YIqX?rq
zlOW?}ClP)|#@fk2qOQVVL)j9G(sL6lihMyvSxjCf>MR(_z`#%q(#!$Y%)>bOpXlp)
zW`<@ahFTVe8Wx5W76x+&tA>rChMmEta1ldz3Ijv1CaYgMNDm0Z<FSYlWHcx)H93pa
zKx{`40SdKSteGXLxy84b3-Sw!Y(b)aAi^KyTjuoC5={<>KRp;2m>G(!CufP9Gd6Bs
zBreFv8wLsnrXq2W`tZpIBvct^OnxR|B>?hNQ3Oa7>LUY5Nw)xyVpfP*$soBXkPTdk
zX(g#e#U+U)sYM|mQE2plRe<8ZNC>2iJ-#HdC_S}g+T?!84U9~a9i*N?;)+$0fq`Mk
zWP52FMu*8Y(vtGvI8FhX1a<}30bmd5fyBHgZ;@8C0p)E-C>Veo1@$1vJw;&cpujIm
z1=-7zlAo6v#aWP%8J}2Glvr5=PAaS*kI$K`DKm==q6rk=tRPD_Zhk1Uj8QWQWEUv8
z7Nvn$2>ZdIt`8Cu0}(!xH^|B9*nu1YN$o`-f8Sy&N-a+;N`W|m4dU}636O?_$-m^Z
z8Mka!lh0r@heRqUTWWF_*@L7(PAG~5vB3UN2eB+b{@^SrO3W)R$S+PUDwupyK~^OP
zWG6dPY~+HJF&0B20hDZutR{0QN--Xptg6@~4mJ*yC5k}l0-k-q{x)J@V7NK?nxb`>
zImkW@5TOMkv_XUkhyW)mT@VXw1}G^MfwD&tIHbX$1r8`sxE6suQ2<h03L=aqe^e5m
zT&E-;rYOfF!o$YH#>2tG#>2(K%+JBY!^1XtiITP;D6VgDW|pKDmE`B=6c@QpexT$I
E0F`?-lK=n!

diff --git a/__pycache__/logic.cpython-35.pyc b/__pycache__/logic.cpython-35.pyc
index b6f2e6f8362795f1630ed908724d5b72ef96b480..dd61672a13e9ee6b4c277e0eb230bfb7d2b4d481 100644
GIT binary patch
delta 198
zcmaDT^H7FejF*=y%lpbk_QRZvw<e$FjAc<~U|^VdQEc)bo<?pd1_p*AIS`>d`5c!A
zi#k-!fP0QONL`T%0|SF5bCD`Yi42HPoBWvDX!0W-smc00c{tT<;n8E!gqrn-ryHlb
fdA!DqT9YsFT8M&e16g0B0kQ_9xkziWJf9N)Pc$l+

delta 202
zcmaDT^H7FejF*>-@6`E??1woSqb8r`jAc<`U|^VdQEc)bo<?pd1_p*AIS`>V`5c!A
ziyBnUfP0QONL`UK0|SF5bCC*2i42HPo&1>Fh(#T$PM;?ar@AdXdMp}Hb$@ueajKig
eYs{!Q`4X>%DA-1j6N*6Q7lAYvX-<~sa{>TeGAbwl

diff --git a/agent_afterstate.py b/agent_afterstate.py
index 49533e2..312991a 100644
--- a/agent_afterstate.py
+++ b/agent_afterstate.py
@@ -11,7 +11,7 @@ class Action(IntEnum):
     RIGHT = 4
 
 class afterstateAgent:
-    def __init__(self, mat, TD_lambda = 0.0, alpha = 0.0025, gamma = 0.95, epsilon = 0.01, verbose= True, symmetric=1, tuple = 2):
+    def __init__(self, mat, TD_lambda = 0.0, alpha = 0.0025, epsilon = 0.01, verbose= True, symmetric=1, tuple = 2):
         self.state_per_tile = 12
         self.commands = { Action.UP: up, Action.DOWN: down, Action.LEFT: left, Action.RIGHT: right}
         self.alpha = alpha
@@ -143,8 +143,8 @@ class afterstateAgent:
         else:
             self._reset_trace()
         for tr, ind in zip(self.trace, self.index):
-            v = tr.get(ind,0)
-            v += 1 
+            v = tr.get(ind,0.0)
+            v += 1.0
             tr[ind] = v
         # print(self.trace[0])
         # print(np.sum(self.trace,axis=1))
@@ -164,7 +164,7 @@ class afterstateAgent:
             return -1
         if done== 1:
             done = 0 #1 means no reward
-        phi_array = np.array([w[i] for w,i in zip(self.W, self._index(state))])
+        phi_array = np.array([w[i] for w,i in zip(self.W, self._index(afterstate))])
         if act:
             # in the act phase, explore when there is 0
             if 0 in phi_array:
@@ -203,7 +203,7 @@ class afterstateAgent:
             return
         s,r = self.test_next(self._action_index,self.state)
         n = next_state
-        if self.symmetric>0:
+        if self.symmetric>0.1:
             for i in range(4):
                 s = transpose(s)
                 n = transpose(n)
-- 
GitLab