lixiangchun committed on
Commit
dc0bd2a
1 Parent(s): a3b02b5

update README

Browse files
Files changed (3) hide show
  1. README.md +5 -5
  2. pbmc_label.txt.gz +3 -0
  3. pbmc_ranking.txt.gz +3 -0
README.md CHANGED
@@ -24,17 +24,17 @@ class LineDataset(Dataset):
24
  device = "cuda" if torch.cuda.is_available() else "cpu"
25
  torch.set_num_threads(2)
26
 
27
- tokenizer = PreTrainedTokenizerFast.from_pretrained("lixiangchun/transcriptome_iseeek_13millioncells_128tokens")
28
- model = BertForMaskedLM.from_pretrained("lixiangchun/transcriptome_iseeek_13millioncells_128tokens").bert
29
  model = model.to(device)
30
  model.eval()
31
 
32
 
33
- text_file = "/mnt/ssd2/shenhr/BERT/bert_256/pbmc/deal/gene_rank_pmbc.txt"
34
- labels = [s.strip() for s in open('/mnt/ssd2/shenhr/BERT/bert_256/pbmc/deal/labels.txt')]
 
35
  labels = np.asarray(labels)
36
 
37
- lines = [s.strip() for s in open(text_file)]
38
 
39
  ds = LineDataset(lines)
40
  dl = DataLoader(ds, batch_size=80)
 
24
  device = "cuda" if torch.cuda.is_available() else "cpu"
25
  torch.set_num_threads(2)
26
 
27
+ tokenizer = PreTrainedTokenizerFast.from_pretrained("TJMUCH/transcriptome-iseeek")
28
+ model = BertForMaskedLM.from_pretrained("TJMUCH/transcriptome-iseeek").bert
29
  model = model.to(device)
30
  model.eval()
31
 
32
 
33
+ ## Data deposited at https://huggingface.co/TJMUCH/transcriptome-iseeek/tree/main
34
+ lines = [s.strip() for s in gzip.open("pbmc_ranking.txt.gz")]
35
+ labels = [s.strip() for s in gzip.open("pbmc_label.txt.gz")]
36
  labels = np.asarray(labels)
37
 
 
38
 
39
  ds = LineDataset(lines)
40
  dl = DataLoader(ds, batch_size=80)
pbmc_label.txt.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d6171759c36f7c45d9a8230bd2fd0af192a8f12d2b7bbb9d838d6a0d589f9f24
3
+ size 25295
pbmc_ranking.txt.gz ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:588a33ccabe070aa97b6d2580fc8eb3dc16cc4bedc2baaed55b80312dac40d77
3
+ size 26121005