add single file env

afb1dcac · hezhiqiang01 · 3f5c8460 · afb1dcac · afb1dcac
Commit afb1dcac authored Jul 02, 2021 by hezhiqiang01
Show whitespace changes
Inline Side-by-side

Showing with 46 additions and 37 deletions

envs/env.py envs/env.py +45 -0

envs/env_wrappers.py envs/env_wrappers.py +1 -37

No files found.
--- a/envs/env.py
+++ b/envs/env.py
+"""
+# @Time    : 2021/7/2 5:22 下午
+# @Author  : hezhiqiang01
+# @Email   : hezhiqiang01@baidu.com
+# @File    : env.py
+"""
+
+import numpy as np
+
+
+class Env(object):
+    """Multi-agent environment stub whose observations and rewards are random numbers."""
+
+    def __init__(self, i):
+        # `i` is accepted but never read inside this class.
+        self.agent_num = 2  # number of agents (small planes); two here
+        self.obs_dim = 14  # dimension of each agent's observation
+        self.action_dim = 5  # dimension of each agent's action; assumed to be five
+
+    def reset(self):
+        """Return a list of self.agent_num random observations, each of shape (self.obs_dim,)."""
+        return [np.random.random(size=(self.obs_dim,)) for _ in range(self.agent_num)]
+
+    def step(self, actions):
+        """Produce one step of random data; `actions` is not read.
+
+        The original note describes `actions` as a list with one entry of shape
+        (self.action_dim,) per agent: two entries of shape (5,) by default.
+
+        Returns:
+            [obs, rewards, dones, infos], each a list with one entry per agent:
+            an array of shape (self.obs_dim,), a one-element list holding a
+            random float, the flag False, and an empty dict.
+        """
+        sub_agent_obs = []
+        sub_agent_reward = []
+        sub_agent_done = []
+        sub_agent_info = []
+        for _ in range(self.agent_num):
+            # Draw order (observation, then reward) is kept per agent so seeded runs match.
+            sub_agent_obs.append(np.random.random(size=(self.obs_dim,)))
+            sub_agent_reward.append([np.random.rand()])
+            sub_agent_done.append(False)
+            sub_agent_info.append({})
+        return [sub_agent_obs, sub_agent_reward, sub_agent_done, sub_agent_info]
\ No newline at end of file
--- a/envs/env_wrappers.py
+++ b/envs/env_wrappers.py
@@ -9,6 +9,7 @@ Modified from OpenAI Baselines code to work with multi-agent envs
 import numpy as np
 import gym
 from gym import spaces
+from envs.env import Env


 class MultiDiscrete(gym.Space):
@@ -56,43 +57,6 @@ class MultiDiscrete(gym.Space):
        return np.array_equal(self.low, other.low) and np.array_equal(self.high, other.high)


-class Env(object):
-    """
-    # 环境中的智能体
-    """
-    def __init__(self, i):
-        self.agent_num = 2  # 设置智能体(小飞机)的个数，这里设置为两个
-        self.obs_dim = 14  # 设置智能体的观测纬度
-        self.action_dim = 5  # 设置智能体的动作纬度，这里假定为一个五个纬度的
-
-    def reset(self):
-        """
-        # self.agent_num设定为2个智能体时，返回值为一个list，每个list里面为一个shape = (self.obs_dim, )的观测数据
-        """
-        sub_agent_obs = []
-        for i in range(self.agent_num):
-            sub_obs = np.random.random(size=(14, ))
-            sub_agent_obs.append(sub_obs)
-        return sub_agent_obs
-
-    def step(self, actions):
-        """
-        # self.agent_num设定为2个智能体时，actions的输入为一个2纬的list，每个list里面为一个shape = (self.action_dim, )的动作数据
-        # 默认参数情况下，输入为一个list，里面含有两个元素，因为动作纬度为5，所里每个元素shape = (5, )
-        """
-        sub_agent_obs = []
-        sub_agent_reward = []
-        sub_agent_done = []
-        sub_agent_info = []
-        for i in range(self.agent_num):
-            sub_agent_obs.append(np.random.random(size=(14,)))
-            sub_agent_reward.append([np.random.rand()])
-            sub_agent_done.append(False)
-            sub_agent_info.append({})
-
-        return [sub_agent_obs, sub_agent_reward, sub_agent_done, sub_agent_info]
-
-
 class SubprocVecEnv(object):
    def __init__(self, all_args):
        """