codewithdark's picture
Initial model and tokenizer commit
adf4ac7
raw
history blame
245 Bytes
{
"architectures": [
"LatentRecurrentDepthModel"
],
"d_model": 768,
"dropout": 0.1,
"model_type": "latent_recurrent_depth",
"num_heads": 12,
"torch_dtype": "float32",
"transformers_version": "4.48.3",
"vocab_size": 50257
}