gabrielthomasjacobs
init
40bd770
raw
history blame contribute delete
No virus
97 Bytes
# @package _global_
# Model size: roughly 300M parameters.
# Size settings for the transformer language model.
# The child keys must be indented under `transformer_lm`; at column 0 they
# would parse as unrelated top-level keys and `transformer_lm` would be null.
# NOTE(review): presumably `dim` is the model width and has to be divisible
# by `num_heads` (1024 / 16 = 64) — confirm against the consuming model code.
transformer_lm:
  dim: 1024
  num_heads: 16
  num_layers: 24