all-models / rwkv /rwkv6_60.yaml
reach-vb's picture
reach-vb HF staff
Upload folder using huggingface_hub
103d46f verified
raw
history blame
No virus
571 Bytes
model:
class_path: model.lina.Lina
init_args:
n_codebook: 1024
n_special_token_in: 3
n_special_token_out: 3
n_txt_vocab: 180
d_context: 384
d_model: 512
quant_layer: [0, 1, 2, 3]
txt_encoder:
class_path: model.encoder.TextEncoder
init_args:
dim: 512
heads: 1
n_layers: 6
dropout: 0.1
attentive_rnn:
class_path: model.rwkv6x.AttentiveRWKV6
init_args:
d_model: 512
d_context: 512
heads: 1
dropout_att: 0.2
n_layer: 3
blind: True