Skip to content

Commit 3d22f58

Browse files
Tune hyper params
1 parent 4515317 commit 3d22f58

4 files changed

Lines changed: 11 additions & 13 deletions

File tree

training_scripts/GPU/TEDD_1140_base.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@ python3 train.py --train_new \
1616
--dropout_encoder_features 0.3 \
1717
--control_mode keyboard \
1818
--val_check_interval 0.5 \
19-
--hide_map_prob 0.4 \
2019
--devices 1
2120

2221

training_scripts/GPU/TEDD_1140_large.sh

Lines changed: 0 additions & 1 deletion
Original file line number | Diff line number | Diff line change
@@ -16,7 +16,6 @@ python3 train.py --train_new \
1616
--dropout_encoder_features 0.3 \
1717
--control_mode keyboard \
1818
--val_check_interval 0.5 \
19-
--hide_map_prob 0.4 \
2019
--devices 1
2120

2221

training_scripts/TPU/TEDD_1140_base.sh

Lines changed: 6 additions & 6 deletions
Original file line number | Diff line number | Diff line change
@@ -5,23 +5,23 @@ python3 train.py --train_new \
55
--val_dir ../gtaai_datasets/dev \
66
--output_dir models/tedd_1104_base \
77
--encoder_type transformer \
8-
--dataloader_num_workers 32 \
9-
--batch_size 8 \
8+
--dataloader_num_workers 16 \
9+
--batch_size 16 \
1010
--accumulation_steps 1 \
1111
--max_epochs 40 \
12-
--cnn_model_name efficientnet_b4 \
12+
--cnn_model_name convnext_base \
1313
--num_layers_encoder 4 \
1414
--embedded_size 512 \
15-
--learning_rate 1e-5 \
15+
--learning_rate 5e-5 \
1616
--mask_prob 0.2 \
1717
--dropout_cnn_out 0.3 \
1818
--dropout_encoder 0.1 \
1919
--dropout_encoder_features 0.3 \
2020
--control_mode keyboard \
2121
--val_check_interval 0.5 \
22-
--hide_map_prob 0.4 \
22+
--precision 16 \
2323
--devices 8 \
2424
--accelerator tpu \
25-
--report_to tensorboard
25+
--report_to wandb
2626

2727

training_scripts/TPU/TEDD_1140_large.sh

Lines changed: 5 additions & 5 deletions
Original file line number | Diff line number | Diff line change
@@ -5,21 +5,21 @@ python3 train.py --train_new \
55
--val_dir ../gtaai_datasets/dev \
66
--output_dir models/tedd_1104_large \
77
--encoder_type transformer \
8-
--dataloader_num_workers 32 \
8+
--dataloader_num_workers 16 \
99
--batch_size 8 \
1010
--accumulation_steps 1 \
1111
--max_epochs 40 \
12-
--cnn_model_name efficientnet_b7 \
13-
--num_layers_encoder 4 \
12+
--cnn_model_name convnext_large \
13+
--num_layers_encoder 6 \
1414
--embedded_size 512 \
15-
--learning_rate 1e-5 \
15+
--learning_rate 5e-5 \
1616
--mask_prob 0.2 \
1717
--dropout_cnn_out 0.3 \
1818
--dropout_encoder 0.1 \
1919
--dropout_encoder_features 0.3 \
2020
--control_mode keyboard \
2121
--val_check_interval 0.5 \
22-
--hide_map_prob 0.4 \
22+
--precision 16 \
2323
--devices 8 \
2424
--accelerator tpu \
2525
--report_to wandb

0 commit comments

Comments (0)