Professional Documents
Culture Documents
Data Visualization-05-03
Data Visualization-05-03
In [5]: transactions.info()
<class 'pandas.core.frame.DataFrame'>
RangeIndex: 10 entries, 0 to 9
Data columns (total 5 columns):
# Column Non-Null Count Dtype
--- ------ -------------- -----
0 TransactionID 10 non-null int64
1 TransactionDate 10 non-null object
2 UserID 9 non-null float64
3 ProductID 10 non-null int64
4 Quantity 10 non-null int64
dtypes: float64(1), int64(3), object(1)
memory usage: 532.0+ bytes
In [6]: transactions.shape[0]
Out[6]: 10
In [7]: transactions.shape[1]
Out[7]: 5
In [8]: transactions.index.values
In [9]: transactions.columns.values
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 1/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 2010-08-21 7.0 2 1
1 2 2011-05-26 3.0 4 1
2 3 2011-06-16 3.0 3 1
3 4 2012-08-26 1.0 2 3
4 5 2013-06-06 2.0 4 1
5 6 2013-12-23 2.0 5 6
6 7 2013-12-30 3.0 4 1
7 8 2014-04-24 NaN 2 3
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
9 10 2016-05-08 3.0 4 4
8 9 2015-04-24 7.0 4 3
7 8 2014-04-24 NaN 2 3
6 7 2013-12-30 3.0 4 1
5 6 2013-12-23 2.0 5 6
4 5 2013-06-06 2.0 4 1
3 4 2012-08-26 1.0 2 3
2 3 2011-06-16 3.0 3 1
1 2 2011-05-26 3.0 4 1
0 1 2010-08-21 7.0 2 1
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 2/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
6 7 2013-12-30 3.0 4 1
4 5 2013-06-06 2.0 4 1
2 3 2011-06-16 3.0 3 1
1 2 2011-05-26 3.0 4 1
0 1 2010-08-21 7.0 2 1
8 9 2015-04-24 7.0 4 3
7 8 2014-04-24 NaN 2 3
3 4 2012-08-26 1.0 2 3
9 10 2016-05-08 3.0 4 4
5 6 2013-12-23 2.0 5 6
0 2 1 2010-08-21 1 7.0
1 4 1 2011-05-26 2 3.0
2 3 1 2011-06-16 3 3.0
3 2 3 2012-08-26 4 1.0
4 4 1 2013-06-06 5 2.0
5 5 6 2013-12-23 6 2.0
6 4 1 2013-12-30 7 3.0
7 2 3 2014-04-24 8 NaN
8 4 3 2015-04-24 9 7.0
9 4 4 2016-05-08 10 3.0
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 3/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 7.0 1 2010-08-21 2 1
1 3.0 2 2011-05-26 4 1
2 3.0 3 2011-06-16 3 1
3 1.0 4 2012-08-26 2 3
4 2.0 5 2013-06-06 4 1
5 2.0 6 2013-12-23 5 6
6 3.0 7 2013-12-30 4 1
7 NaN 8 2014-04-24 2 3
8 7.0 9 2015-04-24 4 3
9 3.0 10 2016-05-08 4 4
In [15]: transactions.values[:, 0]
In [16]: transactions.values[:, 0]
In [18]: transactions.iloc[[0,2,5]]
0 1 2010-08-21 7.0 2 1
2 3 2011-06-16 3.0 3 1
5 6 2013-12-23 2.0 5 6
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 4/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
1 2 2011-05-26 3.0 4 1
3 4 2012-08-26 1.0 2 3
4 5 2013-06-06 2.0 4 1
6 7 2013-12-30 3.0 4 1
7 8 2014-04-24 NaN 2 3
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
In [20]: transactions[:3]
transactions.head(3)
0 1 2010-08-21 7.0 2 1
1 2 2011-05-26 3.0 4 1
2 3 2011-06-16 3.0 3 1
In [21]: transactions[3:]
transactions.tail(-3)
3 4 2012-08-26 1.0 2 3
4 5 2013-06-06 2.0 4 1
5 6 2013-12-23 2.0 5 6
6 7 2013-12-30 3.0 4 1
7 8 2014-04-24 NaN 2 3
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
In [22]: transactions.tail(2)
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 5/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
In [23]: transactions.tail(-2)
2 3 2011-06-16 3.0 3 1
3 4 2012-08-26 1.0 2 3
4 5 2013-06-06 2.0 4 1
5 6 2013-12-23 2.0 5 6
6 7 2013-12-30 3.0 4 1
7 8 2014-04-24 NaN 2 3
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
3 4 2012-08-26 1.0 2 3
5 6 2013-12-23 2.0 5 6
7 8 2014-04-24 NaN 2 3
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
In [25]: transactions[transactions.UserID == 2]
4 5 2013-06-06 2.0 4 1
5 6 2013-12-23 2.0 5 6
5 6 2013-12-23 2.0 5 6
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 6/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 2010-08-21 7.0 2 1
1 2 2011-05-26 3.0 4 1
2 3 2011-06-16 3.0 3 1
3 4 2012-08-26 1.0 2 3
5 6 2013-12-23 2.0 5 6
6 7 2013-12-30 3.0 4 1
8 9 2015-04-24 7.0 4 3
9 10 2016-05-08 3.0 4 4
In [28]: foo = np.array([True, False, True, False, True, False, True, False, True, F
transactions[foo]
0 1 2010-08-21 7.0 2 1
2 3 2011-06-16 3.0 3 1
4 5 2013-06-06 2.0 4 1
6 7 2013-12-30 3.0 4 1
8 9 2015-04-24 7.0 4 3
0 1 2010-08-21 7.0 2 1
2 3 2011-06-16 3.0 3 1
3 4 2012-08-26 1.0 2 3
9 10 2016-05-08 3.0 4 4
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 7/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 2010-08-21 7.0 2 1
1 2 2011-05-26 3.0 4 1
2 3 2011-06-16 3.0 3 1
4 5 2013-06-06 2.0 4 1
5 6 2013-12-23 2.0 5 6
6 7 2013-12-30 3.0 4 1
8 9 2015-04-24 7.0 4 3
3 4 2012-08-26 1.0 2 3
7 8 2014-04-24 NaN 2 3
9 10 2016-05-08 3.0 4 4
0 1 7.0
1 2 3.0
2 3 3.0
3 4 1.0
4 5 2.0
5 6 2.0
6 7 3.0
7 8 NaN
8 9 7.0
9 10 3.0
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 8/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 2010-08-21
1 2 2011-05-26
2 3 2011-06-16
3 4 2012-08-26
4 5 2013-06-06
5 6 2013-12-23
6 7 2013-12-30
7 8 2014-04-24
8 9 2015-04-24
9 10 2016-05-08
5 6 2013-12-23
6 7 2013-12-30
7 8 2014-04-24
8 9 2015-04-24
9 10 2016-05-08
0 1 7.0 1
1 2 3.0 1
2 3 3.0 1
3 4 1.0 3
4 5 2.0 1
5 6 2.0 6
6 7 3.0 1
7 8 NaN 3
8 9 7.0 3
9 10 3.0 4
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 9/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 2010-08-21 2
1 2011-05-26 4
2 2011-06-16 3
3 2012-08-26 2
4 2013-06-06 4
5 2013-12-23 5
6 2013-12-30 4
7 2014-04-24 2
8 2015-04-24 4
9 2016-05-08 4
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 10/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1.0 1
1 2.0 2
2 3.0 4
3 7.0 2
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 11/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
In [52]: transactions[~transactions['UserID'].isin(users['UserID'])]
0 1 2010-08-21 7.0 2 1
7 8 2014-04-24 NaN 2 3
8 9 2015-04-24 7.0 4 3
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 12/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 13/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 1
1 1 2
2 1 3
3 1 4
4 1 5
5 2 1
6 2 2
7 2 3
8 2 4
9 2 5
10 3 1
11 3 2
12 3 3
13 3 4
14 3 5
15 4 1
16 4 2
17 4 3
18 4 4
19 4 5
20 5 1
21 5 2
22 5 3
23 5 4
24 5 5
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 14/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 1 0.0
1 1 2 3.0
2 1 3 0.0
3 1 4 0.0
4 1 5 0.0
5 2 1 0.0
6 2 2 0.0
7 2 3 0.0
8 2 4 1.0
9 2 5 6.0
10 3 1 0.0
11 3 2 0.0
12 3 3 1.0
13 3 4 6.0
14 3 5 0.0
15 4 1 0.0
16 4 2 0.0
17 4 3 0.0
18 4 4 0.0
19 4 5 0.0
20 5 1 0.0
21 5 2 0.0
22 5 3 0.0
23 5 4 0.0
24 5 5 0.0
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 15/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
0 1 2010-08-21 7.0 2 1 1
1 1 2010-08-21 7.0 2 1 9
2 9 2015-04-24 7.0 4 3 1
3 9 2015-04-24 7.0 4 3 9
4 2 2011-05-26 3.0 4 1 2
5 2 2011-05-26 3.0 4 1 3
6 2 2011-05-26 3.0 4 1 7
7 2 2011-05-26 3.0 4 1 10
8 3 2011-06-16 3.0 3 1 2
9 3 2011-06-16 3.0 3 1 3
10 3 2011-06-16 3.0 3 1 7
11 3 2011-06-16 3.0 3 1 10
12 7 2013-12-30 3.0 4 1 2
13 7 2013-12-30 3.0 4 1 3
14 7 2013-12-30 3.0 4 1 7
15 7 2013-12-30 3.0 4 1 10
16 10 2016-05-08 3.0 4 4 2
17 10 2016-05-08 3.0 4 4 3
18 10 2016-05-08 3.0 4 4 7
19 10 2016-05-08 3.0 4 4 10
20 4 2012-08-26 1.0 2 3 4
21 5 2013-06-06 2.0 4 1 5
22 5 2013-06-06 2.0 4 1 6
23 6 2013-12-23 2.0 5 6 5
24 6 2013-12-23 2.0 5 6 6
25 8 2014-04-24 NaN 2 3 8
2010-08-
1 2 Pedro male 2010-08-01 5.0 2013-06-06 4.
08
2016-06-
2 3 Caroline female 2012-10-23 2.0 2011-05-26 4.
07
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 16/17
3/8/24, 6:10 PM Data-Visualization-05-03 - Jupyter Notebook
In [78]: transactions
In [ ]:
localhost:8888/notebooks/Data-Visualization-05-03.ipynb 17/17