This project is a multi-agent reinforcement learning project that uses MAPPO and MADDPG algorithms to train a group of drones. The drones are trained in a simulated environment adopted from Gym-PyBullet-Drones.
python3 -m pip install -e .gui=False
record_video=True
n_gpu = 1
algo_type = "hover"
action_type = "pid"
python scripts/learning/singleagent_ppo.py \
--env=$algo_type \
--act=$action_type \
--record_video=$record_video \
--gui=$guigui=False
record_video=True
n_gpu = 1
algo_type = "hover"
action_type = "pid"
python scripts/learning/singleagent_ddpg.py \
--env=$algo_type \
--act=$action_type \
--record_video=$record_video \
--gui=$guiFor Training:
gui=False
record_video=True
num_drones = 2
n_gpu = 0
algo_type = "flock"
RLLIB_NUM_GPUS=$n_gpu \
python scripts/learning/multiagent_ppo.py \
--env $algo_type \
--num_drones $num_drones \
--record_video=$record_video \
--gui=$guiFor Testing:
colab=True
gui=False
record_video=True
result_folder="./results/save-flock-2-cc-kin-rpm-08.21.2023_13.55.36"
python scripts/learning/test_multiagent_ppo.py \
--exp $result_folder \
--record_video=$record_video \
--gui=$gui \
--colab=$colabFor Training:
gui=False
record_video=True
num_drones = 2
n_gpu = 0
algo_type = "flock"
RLLIB_NUM_GPUS=$n_gpu \
python scripts/learning/multiagent_ddpg.py \
--env $algo_type \
--num_drones $num_drones \
--record_video=$record_video \
--gui=$guiFor Testing:
colab=True
gui=False
record_video=True
result_folder="./results/save-flock-2-cc-kin-rpm-08.21.2023_13.55.36"
python scripts/learning/test_multiagent_ddpg.py \
--exp $result_folder \
--record_video=$record_video \
--gui=$gui \
--colab=$colabcsv = "./results/save-flock-2-cc-kin-rpm-08.21.2023_13.55.36/DDPG/progress.csv"
label = "Multi-Agent DDPG"
python scripts/visualize/results.py \
--csv $csv \
--label $label