Advertisement
thibthibaut

Untitled

Nov 24th, 2015
78
0
Never
Not a member of Pastebin yet? Sign Up, it unlocks many cool features!
text 0.84 KB | None | 0 0
  % Transition table: trans(s, a) is the state reached by taking action a
  % (columns 1..4) in state s (rows 1..16).
  trans = [ ...
       2,  4,  5, 13; ...
       1,  3,  6, 14; ...
       4,  2,  7, 15; ...
       3,  1,  8, 16; ...
       6,  8,  1,  9; ...
       5,  7,  2, 10; ...
       8,  6,  3, 11; ...
       7,  5,  4, 12; ...
      10, 12, 13,  5; ...
       9, 11, 14,  6; ...
      12, 10, 15,  7; ...
      11,  9, 16,  8; ...
      14, 16,  9,  1; ...
      13, 15, 10,  2; ...
      16, 14, 11,  3; ...
      15, 13, 12,  4 ];

  % Reward table: rew(s, a) is the immediate reward for taking action a in
  % state s; it has the same 16-by-4 layout as trans.
  rew = [ ...
       0, -1,  0, -1; ...
       0,  0,  0, -1; ...
       0,  0,  0, -1; ...
       0, -1,  0, -1; ...
      -1, -1,  0,  0; ...
       0,  0,  0,  0; ...
       0,  0,  0,  0; ...
       0,  1,  0,  0; ...
      -1, -1,  0,  0; ...
       0,  0,  0,  0; ...
       0,  0,  0,  0; ...
       0,  1,  0,  0; ...
       0, -1,  0, -1; ...
       0,  0,  0,  1; ...
       0,  0,  0,  1; ...
      -1,  0, -1,  0 ];
  22.  
  23.  
  % Policy iteration over the tables trans (successor states) and rew
  % (immediate rewards), both indexed as (state, action).
  %
  % Outputs left in the workspace:
  %   policy - 1-by-numStates row vector; policy(s) is the chosen action index
  %   value  - 1-by-numStates row vector of state-value estimates
  %   g      - discount factor applied to the successor state's value
  numStates = size(trans, 1);   % 16 for the table defined in this script
  policy = ones(1, numStates);
  value = zeros(1, numStates);
  g = 0.2;

  for p = 1:100
    % Improvement: for every state pick the action with the largest one-step
    % backup. max returns the first index on ties, so lower-numbered actions
    % win when backups are equal.
    for s = 1:numStates
      [~, policy(s)] = max(rew(s, :) + g * value(trans(s, :)));
    end

    % Evaluation: a single in-place sweep under the current policy. States
    % later in the sweep already see the values updated earlier in it.
    for s = 1:numStates
      a = policy(s);
      value(s) = rew(s, a) + g * value(trans(s, a));
    end
  end
  37.  
  % Roll out the learned policy: start in state 1 and follow policy for
  % numSteps transitions, recording every visited state (start included).
  numSteps = 9;
  states = zeros(1, numSteps + 1);   % preallocated; 10 entries in total
  states(1) = 1;                     % semicolon keeps the console quiet

  for r = 1:numSteps
    s = states(r);
    a = policy(s);
    states(r + 1) = trans(s, a);
  end

  % walkshow is defined outside this script; it receives the visited states
  % as a column vector (presumably to visualise the walk -- confirm).
  walkshow(states.')
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement