Advertisement
Not a member of Pastebin yet?
Sign Up,
it unlocks many cool features!
- import numpy as np
- import scipy as sp
- import matplotlib as ml
- espaco=[0,6,1,0,2,2,3,0,0,0,1,3,1,0,0,0,4,2,2,5,0,1,1,0]
- accao=["norte", "sul", "este", "oeste"]
- PAndar=0.5
- PParado=0.2
- PSeguirOutra=0.3
- FD= float(raw_input("Qual o fator de desconto?"))
- E= float(raw_input("Qual o erro maximo a tolerar?"))
- #iteração de valor
- n,e,s,o=0,0,0,0
- def iteracaoValor():
- #for idx, val in enumerate (espaco):
- #U(idx)=0
- d=0
- while d<(E*((1-FD)/FD)):
- for idx, val in enumerate(espaco):
- def U(idx):
- if idx < len(espaco):
- valor = espaco[idx]+ FD *(PParado*espaco[idx]+PAndar*U(idx+1)+PSeguirOutra*U(idx-1))
- print valor
- return valor
- if (U(idx)-U(idx+1))>d:
- d=(U(idx)-U(idx+1))
- return U(idx)
- print"A política que o robot deve seguir, utilizando a iteração de valor, é:%d\n " % iteracaoValor()
Advertisement
Add Comment
Please, Sign In to add comment
Advertisement