alexkueck committed on
Commit
9df3da3
1 Parent(s): 5e025c2

Update utils.py

Browse files
Files changed (1) hide show
  1. utils.py +1 -1
utils.py CHANGED
@@ -147,7 +147,7 @@ def normalise_prompt (prompt):
147
  nltk.download('stopwords')
148
  stop_words = set(stopwords.words('english'))
149
  tokens = [word for word in tokens if not word in stop_words]
150
- # 5. Lemmatization - worte gruppieren, die ähnlich sind
151
  nltk.download('wordnet')
152
  lemmatizer = WordNetLemmatizer()
153
  tokens = [lemmatizer.lemmatize(word) for word in tokens]
 
147
  nltk.download('stopwords')
148
  stop_words = set(stopwords.words('english'))
149
  tokens = [word for word in tokens if not word in stop_words]
150
+ # 5. Lemmatisierung: Worte in Grundform bringen, um Text besser vergleichen zu können
151
  nltk.download('wordnet')
152
  lemmatizer = WordNetLemmatizer()
153
  tokens = [lemmatizer.lemmatize(word) for word in tokens]