adefossez's picture
updated demo
a16e65e
raw
history blame
109 Bytes
# @package _global_
# GPT-2-like model scale (~1.5B parameters)
# Size settings for the transformer language model. The keys must be indented
# under `transformer_lm` so they form its mapping rather than top-level keys.
transformer_lm:
  # Model width; 1536 is evenly divisible by num_heads (1536 / 24 = 64).
  # NOTE(review): presumably 64 is the per-head dimension; confirm in consumer.
  dim: 1536
  num_heads: 24
  num_layers: 48