fork download
  1. /#Data preprocessing
  2. #importing the libraries
  3. import numpy as np
  4. import matplotlib.pyplot
  5. import pandas as pd
  6.  
  7. #importing the dataset
  8. dataset=pd.read_csv('Data.csv')
  9. X=dataset.iloc[:,:-1].values
  10. Y=dataset.iloc[:,3].values
  11.  
  12. #taking care of the missing data
  13. from sklearn.impute import SimpleImputer
  14. imputer=SimpleImputer(missing_values=np.nan, strategy='mean')
  15. #imputer=SimpleImputer()
  16. imputer=imputer.fit(X[:,1:3])#the upperbound is excluded
  17. X[:,1:3]=imputer.transform(X[:,1:3])
  18. print(X)
  19.  
  20. # Encoding categorical data
  21. # Encoding the Independent Variable Country
  22. from sklearn.preprocessing import LabelEncoder, OneHotEncoder
  23. from sklearn.compose import ColumnTransformer
  24. labelencoder_X = LabelEncoder()
  25. X[:, 0] = labelencoder_X.fit_transform(X[:, 0])
  26. columnTransformer = ColumnTransformer([('encoder', OneHotEncoder(),
  27. [0])],remainder='passthrough')
  28. X=np.array(columnTransformer.fit_transform(X),dtype=np.str)
Success #stdin #stdout 0.02s 25792KB
stdin
Standard input is empty
stdout
/#Data preprocessing 
#importing the libraries 
import numpy as np 
import matplotlib.pyplot 
import pandas as pd 
 
#importing the dataset 
dataset=pd.read_csv('Data.csv') 
X=dataset.iloc[:,:-1].values 
Y=dataset.iloc[:,3].values 
 
#taking care of the missing data 
from sklearn.impute import SimpleImputer 
imputer=SimpleImputer(missing_values=np.nan, strategy='mean') 
#imputer=SimpleImputer() 
imputer=imputer.fit(X[:,1:3])#the upperbound is excluded 
X[:,1:3]=imputer.transform(X[:,1:3]) 
print(X) 
 
# Encoding categorical data 
# Encoding the Independent Variable Country 
from sklearn.preprocessing import LabelEncoder, OneHotEncoder 
from sklearn.compose import ColumnTransformer 
labelencoder_X = LabelEncoder() 
X[:, 0] = labelencoder_X.fit_transform(X[:, 0]) 
columnTransformer = ColumnTransformer([('encoder', OneHotEncoder(), 
[0])],remainder='passthrough') 
X=np.array(columnTransformer.fit_transform(X),dtype=np.str)