-
Notifications
You must be signed in to change notification settings - Fork 3
/
Copy pathtrain.sh
executable file
·38 lines (31 loc) · 1.18 KB
/
train.sh
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
#!/bin/sh
# Launch train.py once per seed (1..seed_max) with the settings defined below.
#
# Usage: ./train.sh [extra train.py arguments...]
#
# Every argument given to this script is forwarded unchanged to each train.py
# invocation, after the options assembled here.
#
# Exit status: 0 when every run succeeded, otherwise the exit status of the
# last run that failed. A failed run does not stop the remaining seeds.

seed_max=1
log_level="NOTICE"

# Exported so the python child process sees them in its environment.
# NOTE(review): presumably read by train.py as mode switches - confirm there.
export DEBUG=0
export TRAIN=1
export EVAL=0

scenario="RANDOM"
accelerate=1200 # 1 step = 0.02 * 1200 = 24 s
n_training_threads=4
n_rollout_threads=42
num_env_steps=$((25200 * 60)) # steps_per_episode * episodes
experiment="check"
algo="mappo"
gamma=0.99
gain=0.01
lr=5e-4
critic_lr=$lr # critic uses the same learning rate as --lr
value_loss_coef=1
ppo_epoch=10
num_mini_batch=1
w_qos=4
w_xqos=0.005
log_interval=1
wandb_user="YOUR_WANDB_USER_NAME"
# NOTE(review): wandb_api_key is neither exported nor passed to train.py in
# this script, so it has no effect here - confirm how the key is meant to be
# supplied before relying on it.
wandb_api_key="YOUR_WANDB_API_KEY"

echo "algo is ${algo}, traffic scenario is ${scenario}, max seed is ${seed_max}"

# Status of the most recent failed run; stays 0 while every run succeeds.
rc=0

# Plain POSIX counter instead of `seq`, which is not part of POSIX and whose
# output for a count below 1 differs between implementations.
seed=1
while [ "${seed}" -le "${seed_max}" ]; do
  echo "seed is ${seed}:"
  # CUDA_VISIBLE_DEVICES=0 is set for this command only. Every expansion is
  # quoted so that each value reaches train.py as exactly one argument, and
  # "$@" keeps caller-supplied arguments intact even if they contain spaces.
  CUDA_VISIBLE_DEVICES=0 python train.py \
    --algorithm_name "${algo}" \
    --experiment_name "${experiment}" \
    --scenario "${scenario}" \
    --accelerate "${accelerate}" \
    --seed "${seed}" \
    --n_training_threads "${n_training_threads}" \
    --n_rollout_threads "${n_rollout_threads}" \
    --num_mini_batch "${num_mini_batch}" \
    --num_env_steps "${num_env_steps}" \
    --ppo_epoch "${ppo_epoch}" \
    --gain "${gain}" \
    --gamma "${gamma}" \
    --lr "${lr}" \
    --critic_lr "${critic_lr}" \
    --value_loss_coef "${value_loss_coef}" \
    --user_name "${wandb_user}" \
    --log_level "${log_level}" \
    --log_interval "${log_interval}" \
    --w_qos "${w_qos}" \
    --w_xqos "${w_xqos}" \
    "$@" || rc=$?
  seed=$((seed + 1))
done

# Report a failure from any seed, not just the final one.
exit "${rc}"