Download as pdf or txt
Download as pdf or txt
You are on page 1of 8

9/20/2020 Assignment

Assignment
Name: Md. Nasim Uddin
ID: 15162103276
Intake: 32
Section: 07

In [93]: import pandas as pd


import numpy as np
df=pd.read_csv("HospitalTestData.csv")
df.head()

Out[93]:
age %fat

0 23 9.5

1 23 26.5

2 27 7.8

3 27 17.8

4 39 31.4

In [94]: class Mean:


def calculation(self,age_size,age):
sum=0
for i in range (age_size):
sum=sum+age[i]
sum=sum/age_size
return sum

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 1/8
9/20/2020 Assignment

In [95]: obj=Mean()
mean_of_age=obj.calculation(len(np.array(df.age)),np.array(df.age))
mean_of_fat=obj.calculation(len(np.array(df['%fat'])),np.array(df['%fat']))
print("mean_of_age = ",mean_of_age)
print("mean_of_%fat= ",mean_of_fat)

mean_of_age = 46.44444444444444
mean_of_%fat= 28.783333333333328

In [96]: class Median:


def calculation(self,age_size,age):
sum=0
if age_size%2==0:
sum=age_size/2
sum=(age[int(sum)]+age[int(sum-1)])/2
return sum
else:
sum=int(age_size/2)+1
return age[sum]

In [97]: obj2=Median()
sorted_the_array=np.sort(np.array(df.age))
sorted_the_array2=np.sort(np.array(df['%fat']))
median_of_age=obj2.calculation(len(np.array(df.age)),sorted_the_array)
median_of_fat=obj2.calculation(len(np.array(df['%fat'])),sorted_the_array2)
print("median_of_age = ",median_of_age)
print("median_of_%fat = ",median_of_fat)

median_of_age = 51.0
median_of_%fat = 30.7

In [98]: import math


class standard_deviation:
def calculation(self,age_size,age,m):
sum=0
for i in range(age_size):
age[i]=(age[i]-m)**2
sum=np.sum(age)
sum=math.sqrt(sum/age_size)
return sum

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 2/8
9/20/2020 Assignment

In [99]: obj3=standard_deviation()
std_of_age=obj3.calculation(len(np.array(df.age)),np.array(df.age),mean_of_age)
std_of_fat=obj3.calculation(len(np.array(df['%fat'])),np.array(df['%fat']),mean_of_fat)
print("std_of_age = ",std_of_age)
print("std_of_%fat = ",std_of_fat)

std_of_age = 12.827920936595904
std_of_%fat = 8.993655170915401

In [100]: print("mean_of_age = ",mean_of_age)


print("mean_of_%fat= ",mean_of_fat)
print("****************************")
print("median_of_age = ",median_of_age)
print("median_of_%fat = ",median_of_fat)
print("****************************")
print("std_of_age = ",std_of_age)
print("std_of_%fat = ",std_of_fat)

mean_of_age = 46.44444444444444
mean_of_%fat= 28.783333333333328
****************************
median_of_age = 51.0
median_of_%fat = 30.7
****************************
std_of_age = 12.827920936595904
std_of_%fat = 8.993655170915401

In [101]: import matplotlib.pyplot as plt

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 3/8
9/20/2020 Assignment

In [102]: plt.boxplot(df.age)

Out[102]: {'whiskers': [<matplotlib.lines.Line2D at 0x1ced01d0160>,


<matplotlib.lines.Line2D at 0x1ced01d0220>],
'caps': [<matplotlib.lines.Line2D at 0x1ced01d0b20>,
<matplotlib.lines.Line2D at 0x1ced01d0be0>],
'boxes': [<matplotlib.lines.Line2D at 0x1cecebb2ac0>],
'medians': [<matplotlib.lines.Line2D at 0x1ced017c940>],
'fliers': [<matplotlib.lines.Line2D at 0x1ced017c7c0>],
'means': []}

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 4/8
9/20/2020 Assignment

In [103]: plt.boxplot(df['%fat'])

Out[103]: {'whiskers': [<matplotlib.lines.Line2D at 0x1cece176b80>,


<matplotlib.lines.Line2D at 0x1cece176a60>],
'caps': [<matplotlib.lines.Line2D at 0x1cececd25b0>,
<matplotlib.lines.Line2D at 0x1cececd29d0>],
'boxes': [<matplotlib.lines.Line2D at 0x1cecec25fa0>],
'medians': [<matplotlib.lines.Line2D at 0x1cececd2940>],
'fliers': [<matplotlib.lines.Line2D at 0x1cececd2b20>],
'means': []}

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 5/8
9/20/2020 Assignment

In [104]: x=df['age']
y=df['%fat']
plt.xlabel('Age')
plt.ylabel('%Fat')
plt.scatter(x,y,s=200,c='green',marker='X',edgecolors='black',linewidths=1,alpha=0.75)
plt.show()

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 6/8
9/20/2020 Assignment

In [105]: plt.xlabel('Age')
plt.ylabel('%Fat')
plt.plot(df['age'],df['%fat'])
plt.show()

In [106]: from sklearn.preprocessing import MinMaxScaler


scaler=MinMaxScaler()

In [107]: cols=['age','%fat']
df[cols]=scaler.fit_transform(df[cols])
df.head()

Out[107]:
age %fat

0 0.000000 0.048991

1 0.000000 0.538905

2 0.105263 0.000000

3 0.105263 0.288184

4 0.421053 0.680115

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 7/8
9/20/2020 Assignment

In [108]: x=df['age']
y=df['%fat']
plt.title('q-q plot')
plt.xlabel('Age')
plt.ylabel('%Fat')
plt.scatter(x,y,s=200,c='green',marker='X',edgecolors='black',linewidths=1,alpha=0.75)
plt.plot([0,0.1,0.2,0.3,0.4,0.5,0.6,0.7,0.8,0.9,1],[0,0.1,0.2,0.3,0.4,0.5,0.6,0.7,0.8,0.9,1])
plt.show()

localhost:8888/nbconvert/html/Assignment.ipynb?download=false 8/8

You might also like