1

I'm preparing a model using Logistic Regression but I can't seem to solve this error.

I've tried using Label Encoders but that doesn't work as well.

import pandas as pd
import numpy as np
import scipy.stats as st
import statsmodels.api as sm
import matplotlib.pyplot as plt
from sklearn import preprocessing
from sklearn import utils
import matplotlib.mlab as mlab
import scipy.optimize as opt

df=pd.read_csv('C:/Users/Sehej Bakshi/Desktop/New folder/lung_cancer.csv')
print(df.head())


import sklearn
new_features=df[['cigsPerDay', 'Age', 'BMI', 'Glucose', 'Age_of_initialization', 'Probability']]
x=new_features.iloc[:, :-1]
y=new_features.iloc[:, -1]


from sklearn.model_selection import train_test_split
x_train, x_test, y_train, y_test = train_test_split(x, y, test_size=0.2, random_state=4)

print(x_train.shape, y_train.shape)
print(x_test.shape, y_test.shape)

from sklearn.linear_model import LogisticRegression
LR=LogisticRegression(C=0.01, solver='liblinear').fit(x_train, y_train)
ypred=LR.predict(x_test)
print('Accuracy:', sklearn.metrics.accuracy_score(y_test, y_pred))

Error:

Traceback (most recent call last):
  File "C:/Python36/Hack/lg.py", line 28, in <module>
    LR=LogisticRegression(C=0.01, solver='liblinear').fit(x_train, y_train)
  File "C:\Python36\lib\site-packages\sklearn\linear_model\logistic.py", line 1533, in fit
    check_classification_targets(y)
  File "C:\Python36\lib\site-packages\sklearn\utils\multiclass.py", line 169, in check_classification_targets
    raise ValueError("Unknown label type: %r" % y_type)
ValueError: Unknown label type: 'continuous'
desertnaut
  • 57,590
  • 26
  • 140
  • 166
  • well-known problem here: https://stackoverflow.com/questions/41925157/logisticregression-unknown-label-type-continuous-using-sklearn-in-python – PV8 Nov 08 '19 at 10:43

0 Answers0