you_on_the_titanic / SRLib /Utilities.py
luanzitto's picture
Teste de nova restrição
a0678bc
raw
history blame contribute delete
No virus
1.03 kB
### Imports
import pickle as pkl
#Machine Learning
from sklearn.linear_model import RidgeClassifierCV
class encoding():
def full_pipeline(data_raw):
### Rescaling
mms_age = pkl.load( open( './models/mms_age.sav', 'rb' ) )
mms_sibsp = pkl.load( open( './models/mms_sibsp.sav', 'rb' ) )
mms_fare = pkl.load( open( './models/mms_fare.sav', 'rb' ) )
mms_pclass = pkl.load( open( './models/mms_pclass.sav', 'rb' ) )
df = data_raw[[ 'Sex']]
df['Age'] = mms_age.transform( data_raw[['Age']].values )
df['SibSp'] = mms_sibsp.transform( data_raw[['SibSp']].values )
df['Fare'] = mms_fare.transform( data_raw[['Fare']].values )
df['Pclass'] = mms_pclass.transform( data_raw[['Pclass']].values )
df['__Mr'] = df.Sex.apply( lambda x : 1 if x == 0 else 0)
### Feature Selection
df = df[['Fare', 'Age', 'Sex', 'Pclass', '__Mr', 'SibSp']]
return df
###-