arjunpatel committed on
Commit
2840a75
1 Parent(s): 553a723

Fix a space-specific error on NLTK input

Browse files
Files changed (1) hide show
  1. data_cleaning.py +2 -0
data_cleaning.py CHANGED
@@ -5,6 +5,8 @@ import re
5
 
6
  from nltk.tokenize import word_tokenize, sent_tokenize
7
  from nltk.stem import PorterStemmer
 
 
8
 
9
  from textacy.preprocessing.remove import accents, brackets, punctuation
10
  from textacy.preprocessing.replace import numbers, urls
 
5
 
6
  from nltk.tokenize import word_tokenize, sent_tokenize
7
  from nltk.stem import PorterStemmer
8
+ import nltk
9
+ nltk.download('punkt')
10
 
11
  from textacy.preprocessing.remove import accents, brackets, punctuation
12
  from textacy.preprocessing.replace import numbers, urls