Update oneclass.py
Browse files- oneclass.py +2 -2
oneclass.py
CHANGED
@@ -2,7 +2,7 @@ import pandas as pd
|
|
2 |
from sklearn.feature_extraction.text import TfidfVectorizer
|
3 |
from sklearn.svm import OneClassSVM
|
4 |
|
5 |
-
def select_top_n_papers(n, positive_csv_file, unlabelled_csv_file):
|
6 |
# Load the positive labelled and unlabelled data
|
7 |
positive_labelled_info = pd.read_csv(positive_csv_file)
|
8 |
unlabelled_labelled = pd.read_csv(unlabelled_csv_file)
|
@@ -16,7 +16,7 @@ def select_top_n_papers(n, positive_csv_file, unlabelled_csv_file):
|
|
16 |
X_pos = vectorizer.fit_transform(positive_labelled_info['text'])
|
17 |
|
18 |
# Train a one-class SVM model
|
19 |
-
clf = OneClassSVM(kernel='rbf', nu=
|
20 |
clf.fit(X_pos)
|
21 |
|
22 |
# Transform unlabelled data using the same vectorizer
|
|
|
2 |
from sklearn.feature_extraction.text import TfidfVectorizer
|
3 |
from sklearn.svm import OneClassSVM
|
4 |
|
5 |
+
def select_top_n_papers(n, positive_csv_file, unlabelled_csv_file,nu):
|
6 |
# Load the positive labelled and unlabelled data
|
7 |
positive_labelled_info = pd.read_csv(positive_csv_file)
|
8 |
unlabelled_labelled = pd.read_csv(unlabelled_csv_file)
|
|
|
16 |
X_pos = vectorizer.fit_transform(positive_labelled_info['text'])
|
17 |
|
18 |
# Train a one-class SVM model
|
19 |
+
clf = OneClassSVM(kernel='rbf', nu=nu) # Adjust parameters as needed
|
20 |
clf.fit(X_pos)
|
21 |
|
22 |
# Transform unlabelled data using the same vectorizer
|