File size: 1,031 Bytes
c52bf18
 
 
 
 
 
 
 
 
 
 
 
 
 
60dfd5b
 
 
 
c52bf18
 
 
 
 
 
a0678bc
c52bf18
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
### Imports
import pickle as pkl


#Machine Learning
from sklearn.linear_model    import RidgeClassifierCV


class encoding():    

     
    def full_pipeline(data_raw):
        
        ### Rescaling
        mms_age    = pkl.load( open( './models/mms_age.sav', 'rb' ) )
        mms_sibsp  = pkl.load( open( './models/mms_sibsp.sav', 'rb' ) )
        mms_fare   = pkl.load( open( './models/mms_fare.sav', 'rb' ) )
        mms_pclass = pkl.load( open( './models/mms_pclass.sav', 'rb' ) )

        df = data_raw[[ 'Sex']]        
        df['Age']     = mms_age.transform( data_raw[['Age']].values )
        df['SibSp']   = mms_sibsp.transform( data_raw[['SibSp']].values )
        df['Fare']    = mms_fare.transform( data_raw[['Fare']].values )
        df['Pclass']  = mms_pclass.transform( data_raw[['Pclass']].values ) 
        df['__Mr']    = df.Sex.apply( lambda x : 1 if x == 0 else 0) 

        ### Feature Selection
        df = df[['Fare', 'Age', 'Sex', 'Pclass', '__Mr', 'SibSp']]
        
        return df   


    ###-