Professional Documents
Culture Documents
Assignment 2
Assignment 2
Assignment 2
In [2]: dict1={"Maths_Score":[60,62,65,78,77,np.nan,78,80,66,67],
"Reading_Score":[70,99,90,54,89,65,80,65,89,20],
"Writing_Score":[70,43,80,56,95,56,99,45,90,100],
"Placement_Count":[np.nan,7,8,5,9,8,6,9,5,3],
"Region":[np.nan,"Buldhana","Kothrud","Baner","Nagpur","Dadar",np.nan
"Gender":["Male","Female","Female","Male","Male","Male","Female","Male
"Placement_Count_Year":[2020,2022,2018,2017,2023,2015,2012,np.nan,2010
# Build the working DataFrame from the column lists held in dict1.
# NOTE(review): `pd` and `np` are used, but no import cell (In [1]) is visible in this transcript — confirm it exists.
In [3]: df=pd.DataFrame(dict1)
# Display the whole frame.
In [4]: df
# Count the missing (NaN) entries in each column.
In [5]: df.isnull().sum()
Out[5]:
Maths_Score 1
Reading_Score 0
Writing_Score 0
Placement_Count 1
Region 3
Gender 0
Placement_Count_Year 1
dtype: int64
# Default dropna: returns a new frame without the rows that contain any NaN.
# The result is not assigned, so df itself keeps all of its rows.
In [6]: df.dropna()
# axis=1 drops columns instead of rows: every column holding at least one NaN is removed from the result.
In [7]: df.dropna(axis=1)
Out[7]:
  Reading_Score Writing_Score Gender
0 70 70 Male
1 99 43 Female
2 90 80 Female
3 54 56 Male
4 89 95 Male
5 65 56 Male
6 80 99 Female
7 65 45 Male
8 89 90 Female
9 20 100 Male
# how="all" drops a row only when every value in it is NaN.
# Gender has no missing values (see the isnull counts), so no row qualifies here.
In [8]: df.dropna(how="all")
# thresh=2 keeps the rows that have at least two non-NaN values.
# Reading_Score, Writing_Score and Gender are complete, so every row is kept.
In [9]: df.dropna(thresh=2)
# subset restricts the NaN check to the listed columns; rows with a missing Region are dropped
# (Gender has no NaN, so it removes nothing further).
In [10]: df.dropna(subset=["Region","Gender"])
In [ ]:
# Re-display df; none of the dropna results above were assigned back to it.
In [11]: df
# Replace every NaN in the frame with 8. This touches all columns, including the text column Region.
# The result is only displayed, not assigned.
In [12]: df.replace(to_replace=np.nan,value=8)
# Same replacement limited to one column: missing regions become "Kota" in the returned Series.
In [13]: df["Region"].replace(to_replace=np.nan,value="Kota")
Out[13]:
0 Kota
1 Buldhana
2 Kothrud
3 Baner
4 Nagpur
5 Dadar
6 Kota
7 Wardha
8 Surat
9 Kota
Name: Region, dtype: object
# fillna(0) returns a copy with every NaN set to 0; nothing is assigned, so df still has its NaN values.
In [14]: df.fillna(0)
# Mean imputation: the missing Maths_Score is replaced by the column mean and written back into df.
# From this cell on, df is modified in place across cells.
In [15]: df["Maths_Score"]=df["Maths_Score"].fillna(df["Maths_Score"].mean())
In [16]: df
# Mean imputation for Placement_Count: the missing entry is replaced by the column mean and written back.
# The exported line was cut off after `.mea`, leaving the call unclosed; it is completed here as `.mean())`.
# NOTE(review): `mean` is the only pandas Series method starting with "mea" — confirm against the original notebook.
In [17]: df["Placement_Count"]=df["Placement_Count"].fillna(df["Placement_Count"].mean())
In [18]: df
In [19]: df["Placement_Count_Year"]=df["Placement_Count_Year"].fillna(df["Placement_C
# Display df after the preceding fillna cell.
In [20]: df
# Region holds text, so its missing entries are filled with a fixed label ("Kota") rather than a statistic.
# NOTE(review): execution counts jump from 20 to 23 — cells 21-22 are not present in this transcript.
In [23]: df["Region"]=df["Region"].fillna("Kota")
In [24]: df
# Three imputation experiments follow. Each one rebuilds df from dict1 first, so Maths_Score
# starts with its NaN again and the experiments do not depend on one another.
# NOTE(review): execution counts are out of order (32-34, then 29-31, then 35-37), i.e. the max
# variant was executed before the min variant; a Restart & Run All would renumber them.
In [32]: df=pd.DataFrame(dict1)
df
# Variant 1: fill the missing Maths_Score with the column minimum.
In [33]: df["Maths_Score"]=df["Maths_Score"].fillna(df["Maths_Score"].min())
In [34]: df
# Reset df to the raw data before the next variant.
In [29]: df=pd.DataFrame(dict1)
df
# Variant 2: fill the missing Maths_Score with the column maximum.
In [30]: df["Maths_Score"]=df["Maths_Score"].fillna(df["Maths_Score"].max())
In [31]: df
# Reset df to the raw data before the next variant.
In [35]: df=pd.DataFrame(dict1)
df
# Variant 3: fill the missing Maths_Score with the column standard deviation.
# NOTE(review): std measures spread, not a typical score, so this is an unusual fill value —
# presumably included only to demonstrate the call; confirm intent.
In [36]: df["Maths_Score"]=df["Maths_Score"].fillna(df["Maths_Score"].std())
In [37]: df
In [ ]: