tsantos committed on
Commit
6043993
1 Parent(s): 00ddc44

Update text_cleaning_transforerms.py

Browse files
Files changed (1) hide show
  1. text_cleaning_transforerms.py +5 -0
text_cleaning_transforerms.py CHANGED
@@ -5,6 +5,11 @@ from os.path import isfile, join
5
  import numpy as np
6
  import re
7
 
 
 
 
 
 
8
  from gensim.parsing import preprocessing
9
  from gensim.parsing.preprocessing import strip_tags, strip_punctuation
10
  from nltk.tokenize import word_tokenize, sent_tokenize
 
5
  import numpy as np
6
  import re
7
 
8
+ import nltk
9
+ nltk.download('punkt')
10
+ nltk.download('stopwords')
11
+ nltk.download('wordnet')
12
+
13
  from gensim.parsing import preprocessing
14
  from gensim.parsing.preprocessing import strip_tags, strip_punctuation
15
  from nltk.tokenize import word_tokenize, sent_tokenize