adds environments using robosim and grsim
goncamateus committed Oct 31, 2020
2 parents 6a4c337 + 8792995 commit 036a5b2
Showing 192 changed files with 3,670 additions and 58 deletions.
14 changes: 14 additions & 0 deletions .gitignore
@@ -1,3 +1,14 @@
.DS_Store
*.pyc
rc_gym.egg-info/
pb/*
.vscode/*
*_pb2.py
__pycache__
.idea/
*.0
runs/*
agents/agentShootGoalie/rlAdventure2DDPG/runs/*
# Byte-compiled / optimized / DLL files
__pycache__/
*.py[cod]
@@ -135,3 +146,6 @@ dmypy.json

# Cython debug symbols
cython_debug/

# VSCode
.vscode/
64 changes: 6 additions & 58 deletions README.md
@@ -1,60 +1,8 @@
# RoboCup Very Small Size League Gym Environment
This environment is used in [RobôCIn's](https://github.com/robocin/deepvss) project. Check it out for Reinforcement Learning techniques applied to this environment.

## Project based on:
* [VSS-SDK/VSS-Simulator & VSS-Viewer](https://github.com/VSS-SDK/VSS-Simulator) (x64 binaries provided here)
* [OpenAI Gym Environments](https://github.com/openai/gym)

# Requirements

- FIRASim
  - Clone the repo
    - https://github.com/robocin/FIRASim/releases/tag/deep_train
  - Follow its install guide
    - https://github.com/robocin/FIRASim/blob/master/INSTALL.md
  - Once built, replace the binary file in gym_vss/binaries_envs/fira_sim/bin

- VSS SDK
  - Add the following line to your ~/.bashrc or ~/.bash_profile
    - source /home/$USER/path/to/envs/gym_vss/binaries_envs/vss_sdk/exportlibs

FIRASim requires many more (and heavier) linked libraries than the SDK, which is why we could not handle it the same way as in the SDK guide.

# Install
First, change the 5th line of gym_vss/gym_real_soccer/comm/Makefile to point to your Python include path.
If you are using Anaconda, you only need to change the Python version in the path.
```bash
$ sudo apt-get install swig freeglut3-dev -y
$ cd gym_vss/gym_real_soccer/comm
$ make
$ cd ../../../
$ pip install -e .
```

Note: if you will use only the simulated environment:
- comment out line 3 in gym_vss/__init__.py
- pip install -e .

# Example of agent
```python
import gym
import gym_vss

from gym_vss import SingleAgentSoccerEnvWrapper


env = gym.make('vss_soccer_cont-v0')
# env = SingleAgentSoccerEnvWrapper(env, simulator='sdk')
# If you want FIRASim
env = SingleAgentSoccerEnvWrapper(env, simulator='fira')
env.reset()
for i in range(1):
    done = False
    state = env.reset()
    while not done:
        action = env.action_space.sample()
        next_state, reward, done, _ = env.step(action)
env.close()
```
# RobôCIn Environments for Reinforcement Learning

- deepvss
  - environment for our team using FIRASim

- envs
  - environment for VSS using RoboSim
  - environment for SSL using grSim
60 changes: 60 additions & 0 deletions deepvss/README.md
@@ -0,0 +1,60 @@
# RoboCup Very Small Size League Gym Environment
This environment is used in [RobôCIn's](https://github.com/robocin/deepvss) project. Check it out for Reinforcement Learning techniques applied to this environment.

## Project based on:
* [VSS-SDK/VSS-Simulator & VSS-Viewer](https://github.com/VSS-SDK/VSS-Simulator) (x64 binaries provided here)
* [OpenAI Gym Environments](https://github.com/openai/gym)

# Requirements

- FIRASim
  - Clone the repo
    - https://github.com/robocin/FIRASim/releases/tag/deep_train
  - Follow its install guide
    - https://github.com/robocin/FIRASim/blob/master/INSTALL.md
  - Once built, replace the binary file in gym_vss/binaries_envs/fira_sim/bin

- VSS SDK
  - Add the following line to your ~/.bashrc or ~/.bash_profile
    - source /home/$USER/path/to/envs/gym_vss/binaries_envs/vss_sdk/exportlibs

FIRASim requires many more (and heavier) linked libraries than the SDK, which is why we could not handle it the same way as in the SDK guide.

# Install
First, change the 5th line of gym_vss/gym_real_soccer/comm/Makefile to point to your Python include path.
If you are using Anaconda, you only need to change the Python version in the path.
```bash
$ sudo apt-get install swig freeglut3-dev -y
$ cd gym_vss/gym_real_soccer/comm
$ make
$ cd ../../../
$ pip install -e .
```

Note: if you will use only the simulated environment:
- comment out line 3 in gym_vss/__init__.py
- pip install -e .

# Example of agent
```python
import gym
import gym_vss

from gym_vss import SingleAgentSoccerEnvWrapper


env = gym.make('vss_soccer_cont-v0')
# env = SingleAgentSoccerEnvWrapper(env, simulator='sdk')
# If you want FIRASim
env = SingleAgentSoccerEnvWrapper(env, simulator='fira')
env.reset()
for i in range(1):
    done = False
    state = env.reset()
    while not done:
        action = env.action_space.sample()
        next_state, reward, done, _ = env.step(action)
env.close()
```


55 files renamed without changes.
59 changes: 59 additions & 0 deletions envs/README.md
@@ -0,0 +1,59 @@
# RoboCup SSL OpenAI Gym environments

# Requirements
## Compile protobuf files
```bash
$ sudo apt-get install libprotobuf-dev protobuf-compiler -y
$ cd rc_gym/grsim_ssl/Communication/pb/proto
$ protoc --python_out=../ *.proto
```
## Fix the compiled protobuf imports from relative to absolute
On file **rc_gym/grsim_ssl/Communication/pb/messages_robocup_ssl_wrapper_pb2.py**:


``` python
'before:'
15 - import messages_robocup_ssl_detection_pb2 as messages__robocup__ssl__detection__pb2
16 - import messages_robocup_ssl_geometry_pb2 as messages__robocup__ssl__geometry__pb2

'after:'
15 + import rc_gym.grsim_ssl.Communication.pb.messages_robocup_ssl_detection_pb2 as messages__robocup__ssl__detection__pb2
16 + import rc_gym.grsim_ssl.Communication.pb.messages_robocup_ssl_geometry_pb2 as messages__robocup__ssl__geometry__pb2
```

On file **rc_gym/grsim_ssl/Communication/pb/grSim_Packet_pb2.py**:

``` python
'before:'
15 - import grSim_Commands_pb2 as grSim__Commands__pb2
16 - import grSim_Replacement_pb2 as grSim__Replacement__pb2
'after:'
15 + import rc_gym.grsim_ssl.Communication.pb.grSim_Commands_pb2 as grSim__Commands__pb2
16 + import rc_gym.grsim_ssl.Communication.pb.grSim_Replacement_pb2 as grSim__Replacement__pb2
```
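
The two edits above can also be scripted rather than made by hand. Below is a minimal sketch, assuming the pb directory and package prefix shown above; the helper itself is not part of the repository.

```python
# Hypothetical helper: rewrite the relative protobuf imports to absolute ones.
# Assumes the pb directory and package prefix used in this README.
import re
from pathlib import Path

PB_DIR = Path("rc_gym/grsim_ssl/Communication/pb")
PREFIX = "rc_gym.grsim_ssl.Communication.pb"

for pb_file in PB_DIR.glob("*_pb2.py"):
    text = pb_file.read_text()
    # Turn "import X_pb2 as Y" into "import <PREFIX>.X_pb2 as Y"
    fixed = re.sub(r"^import (\w+_pb2) as",
                   rf"import {PREFIX}.\1 as",
                   text,
                   flags=re.MULTILINE)
    pb_file.write_text(fixed)
```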
## Install environments

```bash
$ pip install -e .
```
# Available Envs
- **grSimSSLPenalty-v0**
- **grSimSSLShootGoalie-v0**

# Example code
```python
import gym
import rc_gym

# Using penalty env
env = gym.make('grSimSSLPenalty-v0')

env.reset()
# Run for 1 episode and print reward at the end
for i in range(1):
    done = False
    while not done:
        action = env.action_space.sample()
        next_state, reward, done, _ = env.step(action)
    print(reward)
```
58 changes: 58 additions & 0 deletions envs/agents/Utils/Buffers.py
@@ -0,0 +1,58 @@
import random
import numpy as np

class ReplayBuffer:
    def __init__(self, capacity):
        self.capacity = capacity
        self.buffer = []
        self.position = 0

    def push(self, state, action, reward, next_state, done):
        if len(self.buffer) < self.capacity:
            self.buffer.append(None)
        self.buffer[self.position] = (state, action, reward, next_state, done)
        self.position = (self.position + 1) % self.capacity

    def sample(self, batch_size):
        batch = random.sample(self.buffer, batch_size)
        state, action, reward, next_state, done = map(np.stack, zip(*batch))
        return state, action, reward, next_state, done

    def __len__(self):
        return len(self.buffer)

class AverageBuffer:
    def __init__(self, capacity=100):
        self.capacity = capacity
        self.buffer = []
        self.index = 0

    def push(self, goal):
        if len(self.buffer) < self.capacity:
            self.buffer.append(None)

        self.buffer[self.index] = goal
        self.index = (self.index + 1) % self.capacity

    def average(self):
        return np.mean(self.buffer if len(self.buffer) > 0 else [0])

    def state_dict(self):
        buffer_dict = {}
        buffer_dict['index'] = self.index
        buffer_dict['bufferSize'] = len(self.buffer)

        for i in range(len(self.buffer)):
            buffer_dict[i] = self.buffer[i]

        return buffer_dict

    def load_state_dict(self, buffer_dict):
        self.index = buffer_dict['index']
        size = buffer_dict['bufferSize']

        for i in range(size):
            self.buffer.append(buffer_dict[i])

    def __len__(self):
        return len(self.buffer)
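
A minimal usage sketch for the two buffers above; the import path, shapes, and values are illustrative assumptions, not part of the repository.

```python
import numpy as np

# Assumed import path for illustration; adjust to wherever Buffers.py lives.
from Buffers import AverageBuffer, ReplayBuffer

memory = ReplayBuffer(capacity=100000)
goals = AverageBuffer(capacity=100)

# Store one illustrative transition (state, action, reward, next_state, done).
state = np.zeros(12, dtype=np.float32)
action = np.zeros(2, dtype=np.float32)
memory.push(state, action, 0.0, state, False)

# Sample a batch once enough transitions are stored.
if len(memory) >= 1:
    states, actions, rewards, next_states, dones = memory.sample(batch_size=1)

# Track episode outcomes and checkpoint the running average.
goals.push(1)  # e.g. 1 when the episode ended in a goal, 0 otherwise
print(goals.average())
checkpoint = goals.state_dict()  # can later be restored with load_state_dict
```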
46 changes: 46 additions & 0 deletions envs/agents/Utils/Networks.py
@@ -0,0 +1,46 @@
import torch
import torch.nn as nn
import torch.nn.functional as F


class ValueNetwork(nn.Module):
    def __init__(self, num_inputs, num_actions, hidden_size, init_w=3e-3):
        super(ValueNetwork, self).__init__()

        self.linear1 = nn.Linear(num_inputs + num_actions, hidden_size)
        self.linear2 = nn.Linear(hidden_size, hidden_size)
        self.linear3 = nn.Linear(hidden_size, 1)

        self.linear3.weight.data.uniform_(-init_w, init_w)
        self.linear3.bias.data.uniform_(-init_w, init_w)

    def forward(self, state, action):
        x = torch.cat([state, action], 1)
        x = F.relu(self.linear1(x))
        x = F.relu(self.linear2(x))
        x = self.linear3(x)
        return x


class PolicyNetwork(nn.Module):
    def __init__(self, num_inputs, num_actions, hidden_size, device, init_w=3e-3):
        super(PolicyNetwork, self).__init__()

        self.linear1 = nn.Linear(num_inputs, hidden_size)
        self.linear2 = nn.Linear(hidden_size, hidden_size)
        self.linear3 = nn.Linear(hidden_size, num_actions)

        self.linear3.weight.data.uniform_(-init_w, init_w)
        self.linear3.bias.data.uniform_(-init_w, init_w)
        self.device = device

    def forward(self, state):
        x = F.relu(self.linear1(state))
        x = F.relu(self.linear2(x))
        x = torch.tanh(self.linear3(x))
        return x

    def get_action(self, state):
        state = torch.FloatTensor(state).unsqueeze(0).to(self.device)
        action = self.forward(state)
        return action.detach().cpu().numpy()[0]
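
A short sketch of how these networks might be wired together for a DDPG-style actor and critic; the dimensions and import path are illustrative assumptions.

```python
import torch

# Assumed import path for illustration; adjust to wherever Networks.py lives.
from Networks import PolicyNetwork, ValueNetwork

device = torch.device("cuda" if torch.cuda.is_available() else "cpu")

# Illustrative sizes; the real ones come from the environment's spaces.
num_inputs, num_actions, hidden_size = 12, 2, 256

policy = PolicyNetwork(num_inputs, num_actions, hidden_size, device).to(device)
critic = ValueNetwork(num_inputs, num_actions, hidden_size).to(device)

state = torch.zeros(num_inputs)
action = policy.get_action(state.numpy())  # numpy action in [-1, 1] (tanh output)
q_value = critic(state.unsqueeze(0).to(device),
                 torch.from_numpy(action).unsqueeze(0).to(device))
print(action, q_value.item())
```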
78 changes: 78 additions & 0 deletions envs/agents/Utils/Normalization.py
@@ -0,0 +1,78 @@
import gym

import numpy as np

class NormalizedWrapper(gym.Wrapper):
    """
    :param env: (gym.Env) Gym environment that will be wrapped
    """

    def __init__(self, env):
        # Call the parent constructor, so we can access self.env later
        super(NormalizedWrapper, self).__init__(env)

        assert isinstance(self.env.action_space,
                          gym.spaces.Box), "This wrapper only works with continuous action space (spaces.Box)"
        assert isinstance(self.env.observation_space,
                          gym.spaces.Box), "This wrapper only works with continuous observation space (spaces.Box)"

        # We modify the wrapper action space, so all actions will lie in [-1, 1]
        self.action_space = gym.spaces.Box(low=-1, high=1, shape=self.env.action_space.shape, dtype=np.float32)
        self.observation_space = gym.spaces.Box(low=-1, high=1, shape=self.env.observation_space.shape, dtype=np.float32)

    def rescale_action(self, scaled_action):
        """
        Rescale the action from [-1, 1] to [low, high]
        (no need for symmetric action space)
        :param scaled_action: (np.ndarray)
        :return: (np.ndarray)
        """
        return self.env.action_space.low + (
            0.5 * (scaled_action + 1.0) * (self.env.action_space.high - self.env.action_space.low))

    def scale_observation(self, observation):
        """
        Scale the observation to bounds [-1, 1]
        """
        return (2 * ((observation - self.env.observation_space.low) /
                     (self.env.observation_space.high - self.env.observation_space.low))) - 1

    def reset(self):
        """
        Reset the environment
        """
        # Reset the wrapped environment and scale the initial observation
        return self.scale_observation(self.env.reset())

    def step(self, action):
        """
        :param action: ([float] or int) Action taken by the agent
        :return: (np.ndarray, float, bool, dict) observation, reward, is the episode over?, additional information
        """
        # Rescale action from [-1, 1] to original [low, high] interval
        rescaled_action = self.rescale_action(action)
        obs, reward, done, info = self.env.step(rescaled_action)
        return self.scale_observation(obs), reward, done, info


class NormalizedActions(gym.ActionWrapper):

    def _action(self, action):
        low_bound = self.action_space.low
        upper_bound = self.action_space.high

        action = low_bound + (action + 1.0) * 0.5 * (upper_bound - low_bound)
        action = np.clip(action, low_bound, upper_bound)

        return action

    def _reverse_action(self, action):
        low_bound = self.action_space.low
        upper_bound = self.action_space.high

        action = 2 * (action - low_bound) / (upper_bound - low_bound) - 1
        action = np.clip(action, low_bound, upper_bound)

        return action
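
A minimal sketch of wrapping a continuous-control environment with the wrapper above. Pendulum-v0 is only a stand-in; the intended targets are the rc_gym / gym_vss environments, and the import path is an assumption.

```python
import gym
import numpy as np

# Assumed import path for illustration; adjust to wherever Normalization.py lives.
from Normalization import NormalizedWrapper

# Any continuous Box env works; Pendulum-v0 is just a stand-in here.
env = NormalizedWrapper(gym.make("Pendulum-v0"))

obs = env.reset()  # observation already scaled to [-1, 1]
action = np.zeros(env.action_space.shape, dtype=np.float32)  # agent acts in [-1, 1]
obs, reward, done, info = env.step(action)  # wrapper rescales to the env's true bounds
env.close()
```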