|
|
@ -8,7 +8,7 @@ optimizer = dict(type='AdamW', lr=5e-4, betas=(0.9, 0.999), weight_decay=0.1, |
|
|
|
constructor='LayerDecayOptimizerConstructor', |
|
|
|
paramwise_cfg=dict( |
|
|
|
num_layers=12, |
|
|
|
layer_decay_rate=0.9, |
|
|
|
layer_decay_rate=0.8, |
|
|
|
custom_keys={ |
|
|
|
'bias': dict(decay_multi=0.), |
|
|
|
'pos_embed': dict(decay_mult=0.), |
|
|
@ -54,7 +54,7 @@ model = dict( |
|
|
|
use_checkpoint=False, |
|
|
|
mlp_ratio=4, |
|
|
|
qkv_bias=True, |
|
|
|
drop_path_rate=0.3, |
|
|
|
drop_path_rate=0.1, |
|
|
|
), |
|
|
|
keypoint_head=dict( |
|
|
|
type='TopdownHeatmapSimpleHead', |
|
|
|