mirror of
https://github.com/RYDE-WORK/lnp_ml.git
synced 2026-03-21 09:36:32 +08:00
16 lines
337 B
JSON
16 lines
337 B
JSON
{
  "d_model": 256,
  "num_heads": 8,
  "n_attn_layers": 4,
  "fusion_strategy": "attention",
  "head_hidden_dim": 128,
  "dropout": 0.1,
  "use_mpnn": true,
  "lr": 0.0001,
  "weight_decay": 1e-05,
  "batch_size": 32,
  "epochs": 100,
  "patience": 15,
  "init_from_pretrain": "models/pretrain_delivery.pt",
  "freeze_backbone": false
}