Safetensors
E1
Commit b06fe2d (verified) by sjain-profluent
Parent: f61b414

Upload 2 files

Files changed (2):
  1. config.json (+4 -3)
  2. model.safetensors (+1 -1)
config.json CHANGED
@@ -4,6 +4,7 @@
   ],
   "bos_token_id": 1,
   "clip_qkv": 8,
+ "dtype": "bfloat16",
   "eos_token_id": 2,
   "gated_mlp": true,
   "global_attention_every_n_layers": 3,
@@ -15,7 +16,7 @@
   "max_num_positions_global": 65536,
   "max_num_positions_within_seq": 8192,
   "max_num_sequences": 512,
- "model_type": "e1",
+ "model_type": "E1",
   "no_ffn_gradient_checkpointing": true,
   "num_attention_heads": 16,
   "num_hidden_layers": 20,
@@ -25,7 +26,7 @@
   "rope_theta_global": 500000.0,
   "rope_theta_within_seq": 10000.0,
   "tie_word_embeddings": false,
- "torch_dtype": "bfloat16",
- "transformers_version": "4.48.3",
+ "transformers_version": "4.56.2",
+ "use_cache": true,
   "vocab_size": 34
  }
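The substantive change here is the torch_dtype → dtype key rename that accompanies the transformers version bump from 4.48.3 to 4.56.2, plus the model_type casing change (e1 → E1) and a new use_cache flag. A minimal loading sketch against a recent transformers release follows; the repo id "Profluent-Bio/E1" is an assumption, and since "E1" is a custom model_type that is not built into transformers, trust_remote_code=True is presumably required:

```python
# Minimal sketch, not an official loading recipe. The repo id
# "Profluent-Bio/E1" is an assumption; "E1" is a custom model_type,
# so transformers must resolve the architecture from code in the repo.
from transformers import AutoModel

model = AutoModel.from_pretrained(
    "Profluent-Bio/E1",       # hypothetical repo id
    trust_remote_code=True,   # load the custom "E1" architecture from repo code
    dtype="bfloat16",         # transformers >= 4.56 kwarg, matching the renamed config key
)
```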
model.safetensors CHANGED
@@ -1,3 +1,3 @@
  version https://git-lfs.github.com/spec/v1
- oid sha256:59e20eecb66d8470fbd78b3c190b1045242541ae990f1e0e57991d83a5a5932a
+ oid sha256:31e09a2542f45b04e6ce4adafb3b657f21e2d56d12bf68fd2266b1576a80bc9b
  size 548657620
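The weights file is tracked with Git LFS, so the diff only touches the pointer: the sha256 oid changes while the size stays at 548,657,620 bytes. Since the oid is the sha256 of the file contents, a downloaded copy can be checked against the new pointer with a minimal sketch like the one below (the local path is an assumption):

```python
# Minimal sketch: verify a downloaded model.safetensors against the new
# Git LFS pointer above. The oid is the sha256 of the raw file contents.
import hashlib

EXPECTED_OID = "31e09a2542f45b04e6ce4adafb3b657f21e2d56d12bf68fd2266b1576a80bc9b"
EXPECTED_SIZE = 548_657_620  # bytes, from the pointer's "size" line

digest = hashlib.sha256()
size = 0
with open("model.safetensors", "rb") as f:            # assumed local path
    for chunk in iter(lambda: f.read(1 << 20), b""):  # hash in 1 MiB chunks
        digest.update(chunk)
        size += len(chunk)

assert size == EXPECTED_SIZE, f"size mismatch: {size} bytes"
assert digest.hexdigest() == EXPECTED_OID, "sha256 mismatch"
print("model.safetensors matches the LFS pointer")
```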