{
  "d_model": 256,
  "nhead": 4,
  "codec_dim": 128,
  "text_vocab_size": 256,
  "text_encoder_layers": 4,
  "predictor_layers": 6,
  "dropout": 0.1,
  "pred_weight": 10.0,
  "roundtrip_weight": 1.0,
  "ema_decay": 0.998,
  "input_noise": 0.0
}