Professional Documents
Culture Documents
Assignments - Day 2 - Jupyter Notebook
Assignments - Day 2 - Jupyter Notebook
In [61]: data.head()
In [62]: data.tail()
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 150 entries, 0 to 149
Data columns (total 5 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 150 150 non-null float64
1 4 150 non-null float64
2 setosa 150 non-null float64
3 versicolor 150 non-null float64
4 disorder 150 non-null object
dtypes: float64(4), object(1)
memory usage: 6.0+ KB
In [64]: data.describe()
In [76]: #3) Perform standard scaler, min/max scaler, and uniform scaler operations on the same dataset
In [81]: # Extract the numerical features (assuming they are all numeric in this case)
# Keep only the numeric columns. Per data.info(), 'versicolor' is a float64
# feature while 'disorder' is the object-dtype column, so dropping 'versicolor'
# would discard a feature and leave a non-numeric column in the scaler input.
numeric_features = data.select_dtypes(include="number")
# StandardScaler: rescale each feature to zero mean and unit variance.
standard_scaler = StandardScaler()
# This call must actually run: with it commented out, `standard_scaled_data`
# is undefined on a fresh kernel and the next statement raises NameError.
standard_scaled_data = standard_scaler.fit_transform(numeric_features)
# The scaler returns a bare array, so reattach the column labels and index.
iris_df_standard_scaled = pd.DataFrame(
    standard_scaled_data,
    columns=numeric_features.columns,
    index=numeric_features.index,
)
iris_df_standard_scaled
In [82]: # MinMaxScaler
# Rescale each feature to the [0, 1] range (MinMaxScaler's default).
min_max_scaler = MinMaxScaler()
min_max_scaled_data = min_max_scaler.fit_transform(numeric_features)
# The scaler returns a bare array, so reattach the column labels and index.
iris_df_min_max_scaled = pd.DataFrame(
    min_max_scaled_data,
    columns=numeric_features.columns,
    index=numeric_features.index,
)
iris_df_min_max_scaled
In [84]: #4) Check for null values in the dataset; if any are present, replace them with zeros
In [46]: iris_df.isnull().sum()  # per-column count of missing values, instead of a full boolean frame
In [50]: iris_df = iris_df.fillna(0)  # fillna(..., inplace=True) returns None, so assigning its result would wipe out iris_df
In [ ]: #5) Apply principal component analysis and SMOTE operations on the same dataset
In [ ]:
In [ ]:
In [51]: #6) Separate the columns of the dataset into independent variables and dependent variables