Spaces:

lora-x
/

Backpack

Runtime error

Lora commited on Jul 11, 2023

Commit

97ff57c

•

1 Parent(s): 71ffc8f

remove old sense files

Files changed (4) hide show

.gitignore ADDED Viewed

	@@ -0,0 +1 @@


1	+ gradio_cached_examples/

senses/all_vecs_mtx.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:1f0c9de5688dd793470c40ebc3b49c29be6ddbf9a38804bca64512940671e129
-size 2470232826

senses/lm_head.pt DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:f94054e64b4d1a07e18443769df4d3b9e346c00b02ffe4e9579e8313034dac24
-size 154411755

senses/use_senses.py DELETED Viewed

@@ -1,44 +0,0 @@
-"""Visualize some sense vectors"""
-import torch
-import argparse
-import transformers
-def visualize_word(word, tokenizer, vecs, lm_head, count=20, contents=None):
-  """
-  Prints out the top-scoring words (and lowest-scoring words) for each sense.
-  """
-  if contents is None:
-    print(word)
-    token_id = tokenizer(word)['input_ids'][0]
-    contents = vecs[token_id] # torch.Size([16, 768])
-  for i in range(contents.shape[0]):
-    print('~~~~~~~~~~~~~~~~~~~~~~~{}~~~~~~~~~~~~~~~~~~~~~~~~'.format(i))
-    logits = contents[i,:] @ lm_head.t() # (vocab,)    [768] @ [768, 50257] -> [50257]
-    sorted_logits, sorted_indices = torch.sort(logits, descending=True)
-    print('~~~Positive~~~')
-    for j in range(count):
-      print(tokenizer.decode(sorted_indices[j]), '\t','{:.2f}'.format(sorted_logits[j].item()))
-    print('~~~Negative~~~')
-    for j in range(count):
-      print(tokenizer.decode(sorted_indices[-j-1]), '\t','{:.2f}'.format(sorted_logits[-j-1].item()))
-  return contents
-  print()
-  print()
-  print()
-argp = argparse.ArgumentParser()
-argp.add_argument('vecs_path')
-argp.add_argument('lm_head_path')
-args = argp.parse_args()
-# Load tokenizer and parameters
-tokenizer = transformers.AutoTokenizer.from_pretrained('gpt2')
-vecs = torch.load(args.vecs_path)
-lm_head = torch.load(args.lm_head_path)
-visualize_word(input('Enter a word:'), tokenizer, vecs, lm_head, count=5)