awni00 committed on
Commit
28d41a1
1 Parent(s): c8efbd5

Push model using huggingface_hub.

Browse files
Files changed (3) hide show
  1. README.md +9 -0
  2. config.json +37 -0
  3. model.safetensors +3 -0
README.md ADDED
@@ -0,0 +1,9 @@
 
 
 
 
 
 
 
 
 
 
1
+ ---
2
+ tags:
3
+ - model_hub_mixin
4
+ - pytorch_model_hub_mixin
5
+ ---
6
+
7
+ This model has been pushed to the Hub using the [PyTorchModelHubMixin](https://huggingface.co/docs/huggingface_hub/package_reference/mixins#huggingface_hub.PyTorchModelHubMixin) integration:
8
+ - Library: [More Information Needed]
9
+ - Docs: [More Information Needed]
config.json ADDED
@@ -0,0 +1,37 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "activation": "gelu",
3
+ "bias": false,
4
+ "d_model": 2048,
5
+ "dff": null,
6
+ "dropout_rate": 0.0,
7
+ "max_block_size": 1024,
8
+ "n_heads_ra": 16,
9
+ "n_heads_sa": 16,
10
+ "n_layers": 24,
11
+ "norm_first": true,
12
+ "pos_enc_type": "RoPE",
13
+ "ra_kwargs": {
14
+ "n_kv_heads": 8,
15
+ "n_relations": 64,
16
+ "rel_activation": "identity",
17
+ "rel_proj_dim": 16,
18
+ "symmetric_rels": false
19
+ },
20
+ "ra_type": "relational_attention",
21
+ "sa_kwargs": {
22
+ "n_kv_heads": 8
23
+ },
24
+ "share_attn_params": false,
25
+ "symbol_retrieval": "symbolic_attention",
26
+ "symbol_retrieval_kwargs": {
27
+ "d_model": 2048,
28
+ "n_heads": 8,
29
+ "n_symbols": 2048,
30
+ "trainable_symbols": false
31
+ },
32
+ "symbol_retriever_config": {
33
+ "shared_symbol_retriever": true,
34
+ "weight_tie_symbol_library": false
35
+ },
36
+ "vocab_size": 50304
37
+ }
model.safetensors ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:df923a992ad5c7787e9c138d94e3c8761f72456ebf621deae5028551c0494083
3
+ size 5101083552