env.py 998 B

1234567891011121314151617181920212223242526272829303132333435363738394041424344454647484950515253545556
  1. #!/usr/bin/env python3
  2. # -*- coding: utf-8 -*-
  3. """
  4. @author: huiming zhou
  5. """
  # Size of the background grid: x_range is the extent along x, y_range the
  # extent along y. Valid cell coordinates are 0 .. x_range - 1 and
  # 0 .. y_range - 1.
  x_range, y_range = 14, 6
  def obs_map():
      """
      Initialize obstacles' positions.

      The obstacles form the rectangular border of the background grid whose
      size is given by the module-level ``x_range`` and ``y_range``. Cells are
      emitted edge by edge, in this order: the row ``y = 0``, the row
      ``y = y_range - 1``, the column ``x = 0``, the column
      ``x = x_range - 1``. Each corner cell lies on one row and one column
      edge, so it appears twice in the returned list.

      :return: map of obstacles, as a list of ``(x, y)`` tuples
      """
      row_first = [(x, 0) for x in range(x_range)]
      row_last = [(x, y_range - 1) for x in range(x_range)]
      col_first = [(0, y) for y in range(y_range)]
      col_last = [(x_range - 1, y) for y in range(y_range)]

      # Concatenate in the fixed edge order documented above.
      return row_first + row_last + col_first + col_last
  def lose_map():
      """
      Initialize losing states' positions.

      The losing states are the cells ``(x, 1)`` for ``x`` from 2 to 11
      inclusive, listed in increasing ``x``.

      :return: losing states, as a list of ``(x, y)`` tuples
      """
      return [(x, 1) for x in range(2, 12)]
  def get_reward(x_next, lose):
      """
      Calculate reward of next state.

      :param x_next: next state
      :param lose: collection of losing states; membership is tested with ``in``
      :return: reward, -100 if ``x_next`` is a losing state and -1 otherwise
      """
      if x_next in lose:
          return -100  # reward : -100, for lose states
      return -1  # reward : -1, for other states