michal committed on
Commit
4c15272
1 Parent(s): 57e8993

dataset switch

Browse files
Files changed (1) hide show
  1. app.py +4 -2
app.py CHANGED
@@ -51,10 +51,12 @@ bi_encoder.max_seq_length = 256 # Truncate long passages to 256 tokens
51
  cross_encoder = CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2')
52
 
53
  """# import datasets"""
54
- dataset = load_dataset("gfhayworth/wiki_mini", split='train')
 
55
  mypassages = list(dataset.to_pandas()['psg'])
56
 
57
- dataset_embed = load_dataset("gfhayworth/wiki_mini_embed", split='train')
 
58
  dataset_embed_pd = dataset_embed.to_pandas()
59
  mycorpus_embeddings = torch_tensor(dataset_embed_pd.values)
60
 
 
51
  cross_encoder = CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2')
52
 
53
  """# import datasets"""
54
+ dataset = load_dataset("gfhayworth/hack_policy", split='train')
55
+
56
  mypassages = list(dataset.to_pandas()['psg'])
57
 
58
+ dataset_embed = load_dataset("gfhayworth/hack_policy_embed", split='train')
59
+
60
  dataset_embed_pd = dataset_embed.to_pandas()
61
  mycorpus_embeddings = torch_tensor(dataset_embed_pd.values)
62