Spaces:

Teery
/

new_space_nlp

Sleeping

Teery committed on Sep 29, 2023

Commit

b02dea6

•

1 Parent(s): 5e65e3b

Update dopset.py

Files changed (1) hide show

dopset.py CHANGED Viewed

@@ -1,13 +1,13 @@
 import string
 import torch
 import numpy as np
-from nltk.corpus import stopwords
-stop_words = set(stopwords.words('english'))
 import torch.nn as nn
 import pickle
 from transformers import BertTokenizer, BertModel, DistilBertTokenizer, DistilBertModel
 from sklearn.linear_model import LogisticRegression
-import nltk
@@ -48,7 +48,7 @@ class LSTMClassifier(nn.Module):
 def data_preprocessing(text: str) -> str:
     """Normalize raw text (pre-commit version shown on the old side of the diff).

     Lowercases the input, drops every character found in
     ``string.punctuation``, removes words present in the module-level
     ``stop_words`` set, and returns the surviving words joined by single
     spaces.
     """
     text = text.lower()
     # Keep only characters that are not ASCII punctuation.
     text = ''.join([c for c in text if c not in string.punctuation])# Remove punctuation
     # The line marked '-' below is the one this commit removes. It is also the
     # step that turns `text` into a list of words, which the join relies on.
-    text = [word for word in text.split() if word not in stop_words]
     # Re-assemble the remaining words with single spaces between them.
     text = ' '.join(text)
     return text

 import string
 import torch
 import numpy as np
+# from nltk.corpus import stopwords
+# stop_words = set(stopwords.words('english'))
 import torch.nn as nn
 import pickle
 from transformers import BertTokenizer, BertModel, DistilBertTokenizer, DistilBertModel
 from sklearn.linear_model import LogisticRegression
+# import nltk
 def data_preprocessing(text: str) -> str:
     """Lowercase *text*, strip ASCII punctuation and collapse whitespace.

     Stop-word filtering is intentionally disabled (the NLTK dependency was
     dropped), so every remaining word is kept.

     Args:
         text: Raw input string.

     Returns:
         The cleaned text: lowercase, without any character from
         ``string.punctuation``, words separated by exactly one space and no
         leading or trailing whitespace. An empty or whitespace-only input
         yields ``''``.
     """
     text = text.lower()
     # Delete all punctuation characters in a single pass.
     text = text.translate(str.maketrans('', '', string.punctuation))
     # Split into words before joining: joining the raw string directly would
     # insert a space between every single character ("hi" -> "h i").
     return ' '.join(text.split())