Professional Documents
Culture Documents
Mcdonald - Jupyter Notebook
Mcdonald - Jupyter Notebook
In [1]:
import numpy as np
import pandas as pd
import os
import seaborn as sns
%matplotlib inline
# Render floats in DataFrame/Series output with exactly two decimal places.
pd.set_option('display.float_format', '{:.2f}'.format)
import scipy.stats as stats
import matplotlib.pyplot as plt
In [2]:
# Load the menu/nutrition CSV into the working DataFrame used by every later cell.
# NOTE(review): the filename contains a space before ".csv" — confirm it matches the file on disk.
DATA_FILE = 'Mcdonald .csv'
df = pd.read_csv(DATA_FILE)
In [3]:
# Preview the first five rows to check that the file parsed as expected.
df.head(n=5)
Out[3]:
    Category                              Item    Serving Size  Calories  Calories from Fat  Total Fat  Total Fat (% Daily Value)  Saturated Fat  Saturated Fat (% Daily Value)  Trans Fat
0  Breakfast                      Egg McMuffin  4.8 oz (136 g)       300                120      13.00                         20           5.00                             25       0.00
1  Breakfast                 Egg White Delight  4.8 oz (135 g)       250                 70       8.00                         12           3.00                             15       0.00
2  Breakfast                  Sausage McMuffin  3.9 oz (111 g)       370                200      23.00                         35           8.00                             42       0.00
3  Breakfast         Sausage McMuffin with Egg  5.7 oz (161 g)       450                250      28.00                         43          10.00                             52       0.00
4  Breakfast  Sausage McMuffin with Egg Whites  5.7 oz (161 g)       400                210      23.00                         35           8.00                             42       0.00
5 rows × 24 columns
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 1/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [4]:
# Summary statistics for the numeric columns, transposed so each column becomes one row.
df.describe().transpose()
Out[4]:
Calories from Fat 260.00 127.10 127.88 0.00 20.00 100.00 200.00 1060.00
Total Fat 260.00 14.17 14.21 0.00 2.38 11.00 22.25 118.00
Total Fat (% Daily Value) 260.00 21.82 21.89 0.00 3.75 17.00 35.00 182.00
Saturated Fat 260.00 6.01 5.32 0.00 1.00 5.00 10.00 20.00
Saturated Fat (% Daily Value) 260.00 29.97 26.64 0.00 4.75 24.00 48.00 102.00
Trans Fat 260.00 0.20 0.43 0.00 0.00 0.00 0.00 2.50
Cholesterol (% Daily Value) 260.00 18.39 29.09 0.00 2.00 11.00 21.25 192.00
Sodium (% Daily Value) 260.00 20.68 24.03 0.00 4.75 8.00 36.25 150.00
Carbohydrates (% Daily Value) 260.00 15.78 9.42 0.00 10.00 15.00 20.00 47.00
Dietary Fiber 260.00 1.63 1.57 0.00 0.00 1.00 3.00 7.00
Dietary Fiber (% Daily Value) 260.00 6.53 6.31 0.00 0.00 5.00 10.00 28.00
Vitamin A (% Daily Value) 260.00 13.43 24.37 0.00 2.00 8.00 15.00 170.00
Vitamin C (% Daily Value) 260.00 8.53 26.35 0.00 0.00 0.00 4.00 240.00
Calcium (% Daily Value) 260.00 20.97 17.02 0.00 6.00 20.00 30.00 70.00
Iron (% Daily Value) 260.00 7.73 8.72 0.00 0.00 4.00 15.00 40.00
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 2/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [5]:
# Print the DataFrame's structural summary (the output below begins with its class line).
df.info()
<class 'pandas.core.frame.DataFrame'>
In [6]:
# Number of menu items in each category, most frequent first.
df.loc[:, 'Category'].value_counts()
Out[6]:
Breakfast 42
Beverages 27
Desserts 7
Salads 6
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 3/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [7]:
# Bar chart of how many menu items fall in each category.
# 'Category' holds text labels, so a histogram is the wrong tool: hist() cuts the label
# positions into 10 numeric bins, which shifts bars away from their tick labels and
# leaves an empty bin. Counting the labels and drawing one bar per category avoids that.
fig, ax = plt.subplots(figsize=(18, 9))
df['Category'].value_counts().plot.bar(ax=ax, title='Menu items per category')
Out[7]:
<AxesSubplot:>
In [8]:
# Side-by-side box plots of the calorie and fat columns on one shared axis.
energy_fat_cols = ['Calories', 'Calories from Fat', 'Total Fat', 'Saturated Fat']
fig, ax = plt.subplots(figsize=(18, 9))
sns.boxplot(data=df[energy_fat_cols], ax=ax);
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 4/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [9]:
# Pairwise correlation matrix of the numeric nutrition columns.
# The text columns (e.g. Category, Item, Serving Size) are excluded explicitly:
# older pandas dropped them silently, but pandas >= 2.0 raises when df.corr()
# meets string data. Selecting numeric dtypes first works on both.
Correlation = df.select_dtypes(include='number').corr()
Correlation
Out[9]:
Total Saturated
Chol
Calories Total Fat (% Saturated Fat (% Trans
Calories Cholesterol (%
from Fat Fat Daily Fat Daily Fat
Value) Value)
Calories from
0.90 1.00 1.00 1.00 0.85 0.85 0.43 0.68
Fat
Total Fat 0.90 1.00 1.00 1.00 0.85 0.85 0.43 0.68
Total Fat (%
0.90 1.00 1.00 1.00 0.85 0.85 0.43 0.68
Daily Value)
Saturated Fat 0.85 0.85 0.85 0.85 1.00 1.00 0.62 0.63
Saturated Fat
(% Daily 0.85 0.85 0.85 0.85 1.00 1.00 0.62 0.63
Value)
Trans Fat 0.52 0.43 0.43 0.43 0.62 0.62 1.00 0.25
Cholesterol (%
0.60 0.68 0.68 0.68 0.63 0.63 0.25 1.00
Daily Value)
Sodium (%
0.71 0.85 0.85 0.85 0.59 0.59 0.19 0.62
Daily Value)
Carbohydrates
(% Daily 0.78 0.46 0.46 0.46 0.59 0.59 0.46 0.27
Value)
Dietary Fiber 0.54 0.58 0.58 0.58 0.35 0.36 0.05 0.44
Dietary Fiber
(% Daily 0.54 0.58 0.58 0.58 0.35 0.35 0.06 0.44
Value)
Vitamin A (%
0.11 0.06 0.05 0.05 0.06 0.07 0.08 0.08
Daily Value)
Vitamin C (%
-0.07 -0.09 -0.09 -0.09 -0.18 -0.18 -0.08 -0.08
Daily Value)
Calcium (%
0.43 0.16 0.16 0.16 0.40 0.40 0.39 0.13
Daily Value)
Iron (% Daily
0.64 0.74 0.73 0.74 0.58 0.58 0.33 0.65
Value)
21 rows × 21 columns
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 5/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [10]:
# Annotated heatmap of the correlation matrix held in `Correlation`.
fig, ax = plt.subplots(figsize=(18, 9))
sns.heatmap(Correlation, annot=True, ax=ax)
Out[10]:
<AxesSubplot:>
In [11]:
# Count the distinct categories once and report it. The original evaluated
# nunique() twice and discarded the first result, which was never displayed
# because it was not the last expression in the cell.
n_categories = df['Category'].nunique()
print('The number of Categories is -', n_categories)
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 6/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [12]:
# NOTE(review): nothing in the visible cells uses the bare name `DataFrame`
# (the code below goes through `pd.DataFrame`). Kept in case a later cell relies
# on it — move it to the import cell at the top, or drop it if unused.
from pandas import DataFrame

# Alphabetically sorted list of the distinct category names.
Category_List = sorted(df['Category'].unique())

# One-column table with a blank header, re-indexed to start at 1 for display.
a = pd.DataFrame(Category_List, columns=[''])
a.index += 1
print('\n \n Let us view the different food categories that are available to us :- \n \n ',
2 Beverages
3 Breakfast
6 Desserts
7 Salads
In [14]:
Out[14]:
Category
Breakfast 50.95
Salads 17.33
Desserts 4.86
Beverages 0.19
In [15]:
# NOTE(review): this value is computed but not shown — it is not the last statement
# in the cell, and the print call that follows evaluates it again.
df['Item'].nunique()
print('\n \n The different type of Food items available at Mcdonald are -', df['Item'].nuni
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 7/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [17]:
# Show the first twenty item names.
df['Item'].iloc[:20]
Out[17]:
0 Egg McMuffin
2 Sausage McMuffin
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 8/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [21]:
Out[21]:
Sodium
Item
Big Breakfast with Hotcakes and Egg Whites (Large Biscuit) 2290
Big Breakfast with Hotcakes and Egg Whites (Regular Biscuit) 2170
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 9/10
11/2/21, 4:45 PM Mcdonald - Jupyter Notebook
In [23]:
Out[23]:
Saturated Fat
Item
Big Breakfast with Hotcakes and Egg Whites (Regular Biscuit) 16.00
Big Breakfast with Hotcakes and Egg Whites (Large Biscuit) 16.00
In [ ]:
localhost:8888/notebooks/Downloads/Mcdonald.ipynb 10/10