Carlos-Francisco Méndez-Cruz

Final version binClass for papers

......@@ -64,7 +64,7 @@ if args.traind and not args.input:
# CMC: split into training and validation datasets
if args.split:
X_train, X_test, y_train, y_test = train_test_split(data.data, labels, test_size = 0.25, random_state = 42)
X_train, X_test, y_train, y_test = train_test_split(data.data, data.target, test_size = 0.25, random_state = 42)
tfidf_model = vectorizer.fit(X_train)
X = vectorizer.transform(X_train)
y = y_train
......