Tom Aarsen committed on
Commit
790cf31
2 Parent(s): 45757a5 048345c

Merge branch 'main' into integration/sentence_transformers

Browse files
Files changed (2) hide show
  1. README.md +1 -0
  2. config.json +3 -3
README.md CHANGED
@@ -2685,6 +2685,7 @@ sentences = ['What is TSNE?', 'Who is Laurens van der Maaten?']
2685
 
2686
  tokenizer = AutoTokenizer.from_pretrained('bert-base-uncased')
2687
  model = AutoModel.from_pretrained('nomic-ai/nomic-embed-text-v1', trust_remote_code=True)
 
2688
 
2689
  encoded_input = tokenizer(sentences, padding=True, truncation=True, return_tensors='pt')
2690
 
 
2685
 
2686
  tokenizer = AutoTokenizer.from_pretrained('bert-base-uncased')
2687
  model = AutoModel.from_pretrained('nomic-ai/nomic-embed-text-v1', trust_remote_code=True)
2688
+ model.eval()
2689
 
2690
  encoded_input = tokenizer(sentences, padding=True, truncation=True, return_tensors='pt')
2691
 
config.json CHANGED
@@ -12,7 +12,7 @@
12
  "bos_token_id": null,
13
  "causal": false,
14
  "dense_seq_output": true,
15
- "embd_pdrop": 0.1,
16
  "eos_token_id": null,
17
  "fused_bias_fc": true,
18
  "fused_dropout_add_ln": true,
@@ -32,7 +32,7 @@
32
  "prenorm": false,
33
  "qkv_proj_bias": false,
34
  "reorder_and_upcast_attn": false,
35
- "resid_pdrop": 0.1,
36
  "rotary_emb_base": 1000,
37
  "rotary_emb_fraction": 1.0,
38
  "rotary_emb_interleaved": false,
@@ -41,7 +41,7 @@
41
  "scale_attn_by_inverse_layer_idx": false,
42
  "scale_attn_weights": true,
43
  "summary_activation": null,
44
- "summary_first_dropout": 0.1,
45
  "summary_proj_to_labels": true,
46
  "summary_type": "cls_index",
47
  "summary_use_proj": true,
 
12
  "bos_token_id": null,
13
  "causal": false,
14
  "dense_seq_output": true,
15
+ "embd_pdrop": 0.0,
16
  "eos_token_id": null,
17
  "fused_bias_fc": true,
18
  "fused_dropout_add_ln": true,
 
32
  "prenorm": false,
33
  "qkv_proj_bias": false,
34
  "reorder_and_upcast_attn": false,
35
+ "resid_pdrop": 0.0,
36
  "rotary_emb_base": 1000,
37
  "rotary_emb_fraction": 1.0,
38
  "rotary_emb_interleaved": false,
 
41
  "scale_attn_by_inverse_layer_idx": false,
42
  "scale_attn_weights": true,
43
  "summary_activation": null,
44
+ "summary_first_dropout": 0.0,
45
  "summary_proj_to_labels": true,
46
  "summary_type": "cls_index",
47
  "summary_use_proj": true,