# Source: AMix-1-1.7B/.hydra/config.yaml
# Uploaded by fdu-lcz, commit 179ab70 (verified): "Upload config.yaml".
# Reported file size: 652 bytes.
# Model section of a Hydra-composed config. Following Hydra's instantiate
# convention, each `_target_` is the dotted path of the object described by
# the mapping it sits in; sibling keys are presumably passed to that object.
#
# NOTE(review): this nesting was reconstructed from a copy whose indentation
# had been lost. Keys, values and key order are unchanged. Left flat, the
# three `_target_` keys collide as duplicates and `model`/`bfn`/`cfg`/`net`/
# `config` become bare null-valued keys. Confirm the nesting against the
# constructors in the `model` package.
model:
  _target_: model.ProfileBFNModule
  bfn:
    _target_: model.ProfileBFN
    # Settings grouped under `cfg` for model.ProfileBFN.
    cfg:
      num_diffusion_timesteps: 100
      gradient_ckpt: false
      beta1: 1.0
      beta_time_order: 2.0
      infer_start: 0.2
    # Network wrapped by model.ProfileBFN.
    net:
      _target_: model.EsmForBFN
      config:
        pretrained_model_name_or_path: facebook/esm2_t30_150M_UR50D
        token_dropout: false
        _attn_implementation_autoset: true
        _attn_implementation: sdpa
        # NOTE(review): the checkpoint name above says `t30`, while the depth
        # below is 48 layers - presumably these size fields override the
        # named checkpoint's architecture; confirm.
        # 1680 / 40 heads = 42 per head; intermediate_size = 4 * hidden_size.
        hidden_size: 1680
        num_hidden_layers: 48
        num_attention_heads: 40
        intermediate_size: 6720
      # NOTE(review): assumed to belong to `net` (sibling of `config`) - TODO
      # confirm; it could instead sit one level up under `bfn`.
      load_pretrained_ckpt: null
  # NOTE(review): assumed to be arguments of model.ProfileBFNModule, all
  # explicitly null here - TODO confirm they are not top-level keys.
  criterion: null
  optimizer: null
  scheduler: null