Spaces:
Running
Running
Add nltk punkt
Browse files- README.md +1 -1
- extract.py +3 -3
- inference.py +1 -0
README.md
CHANGED
@@ -1,6 +1,6 @@
|
|
1 |
---
|
2 |
title: Emotion Detection
|
3 |
-
emoji:
|
4 |
colorFrom: blue
|
5 |
colorTo: yellow
|
6 |
sdk: docker
|
|
|
1 |
---
|
2 |
title: Emotion Detection
|
3 |
+
emoji: 😀➡️😢
|
4 |
colorFrom: blue
|
5 |
colorTo: yellow
|
6 |
sdk: docker
|
extract.py
CHANGED
@@ -1,5 +1,5 @@
|
|
1 |
-
|
2 |
-
|
3 |
|
4 |
from nltk.cluster.util import cosine_distance
|
5 |
from nltk.tokenize import sent_tokenize, word_tokenize
|
@@ -54,7 +54,7 @@ def get_pagerank(importance, top_k):
|
|
54 |
|
55 |
|
56 |
def summarize_text(text: str) -> str:
|
57 |
-
return text
|
58 |
sentences = sent_tokenize(text)[:2000]
|
59 |
top_k = max(20, int(len(sentences) ** .5))
|
60 |
mat = build_matrix(sentences)
|
|
|
1 |
+
import nltk
|
2 |
+
nltk.download('punkt')
|
3 |
|
4 |
from nltk.cluster.util import cosine_distance
|
5 |
from nltk.tokenize import sent_tokenize, word_tokenize
|
|
|
54 |
|
55 |
|
56 |
def summarize_text(text: str) -> str:
|
57 |
+
# return text
|
58 |
sentences = sent_tokenize(text)[:2000]
|
59 |
top_k = max(20, int(len(sentences) ** .5))
|
60 |
mat = build_matrix(sentences)
|
inference.py
CHANGED
@@ -27,6 +27,7 @@ def predict_emotions(text: str) -> str:
|
|
27 |
return '\n'.join(f"{k}: {v}%" for k, v in sorted(emotions_list.items(),
|
28 |
key=lambda x: -x[1]))
|
29 |
|
|
|
30 |
path_gram = './models/mbert-gram/'
|
31 |
model_gram = BertForSequenceClassification.from_pretrained(path_gram)
|
32 |
tokenizer_gram = AutoTokenizer.from_pretrained(path_gram)
|
|
|
27 |
return '\n'.join(f"{k}: {v}%" for k, v in sorted(emotions_list.items(),
|
28 |
key=lambda x: -x[1]))
|
29 |
|
30 |
+
# path_gram = 'Djacon/mbert-gram'
|
31 |
path_gram = './models/mbert-gram/'
|
32 |
model_gram = BertForSequenceClassification.from_pretrained(path_gram)
|
33 |
tokenizer_gram = AutoTokenizer.from_pretrained(path_gram)
|