ariana sutanto commited on
Commit
6ac1f1c
1 Parent(s): dc42939
Files changed (1) hide show
  1. app.py +46 -2
app.py CHANGED
@@ -1,5 +1,6 @@
1
  import streamlit as st
2
  from datasets import load_dataset
 
3
 
4
  dataset_dict = load_dataset('HUPD/hupd',
5
  name='sample',
@@ -11,5 +12,48 @@ dataset_dict = load_dataset('HUPD/hupd',
11
  val_filing_end_date='2016-01-31',
12
  )
13
 
14
- x = st.slider('Select a value')
15
- st.write(x, 'squared is', x * x)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
  import streamlit as st
2
  from datasets import load_dataset
3
+ from transformers import AutoTokenizer, AutoModelForSequenceClassification, pipeline
4
 
5
  dataset_dict = load_dataset('HUPD/hupd',
6
  name='sample',
 
12
  val_filing_end_date='2016-01-31',
13
  )
14
 
15
+ st.title("Patentability Score")
16
+
17
+ abstracts={}
18
+ claims={}
19
+
20
+
21
+ dataset = dataset_dict["train"].shuffle(seed=42).select(range(20))
22
+
23
+ for i in range(0, 20):
24
+
25
+ abstracts[dataset['patent_number'][i]] = dataset['abstract'][i]
26
+ claims[dataset['patent_number'][i]] = dataset['claims'][i]
27
+
28
+
29
+ #def get_score(abstract):
30
+
31
+ # model = AutoModelForSequenceClassification.from_pretrained("arianasutanto/finetuned-distilbert")
32
+ # tokenizer = AutoTokenizer.from_pretrained("arianasutanto/finetuned-distilbert", pad_to_max_length=True)
33
+ #inputs = tokenizer(abstract, max_length=512, padding='max_length', truncation=True, return_tensors='pt')
34
+
35
+ #outputs = model(inputs['input_ids'], attention_mask=inputs['attention_mask'])
36
+ #scores = torch.softmax(outputs.logits, dim=1)[0]
37
+
38
+ #probs = F.softmax(scores, dim=0)
39
+ # accept_prob = probs[0].item()
40
+
41
+ #print(accept_prob)
42
+
43
+ #return #accept_prob
44
+
45
+
46
+
47
+
48
+ patent_num = st.selectbox("Choose a patent number", options=abstracts.keys())
49
+ if st.button("Submit"):
50
+ abstract = st.text_area(label="Abstract",value=abstracts[patent_num])
51
+ claim = st.text_area(label="Claims",value=claims[patent_num])
52
+ #get_score(abstract)
53
+
54
+
55
+ #abstract = abstracts[patent_num]
56
+ #st.write(abstract)
57
+ #claim = claims[patent_num]
58
+ #st.write(claim)
59
+