import seaborn as sns
import pandas as pd

# Load the seaborn "taxis" sample dataset and discard the columns that the
# selection examples below do not use, then preview the first three rows.
taxis = sns.load_dataset('taxis')
unused_cols = ['passengers', 'distance', 'pickup_zone', 'dropoff_zone']
taxis = taxis.drop(columns=unused_cols)
taxis.head(3)


# bracket notation: index the DataFrame with a single column name to get
# that column back as a Series (works for any column name).
taxis['dropoff'].head(3)

0    2019-03-23 20:27:24
1    2019-03-04 16:19:00
2    2019-03-27 18:00:25
Name: dropoff, dtype: object


# dot notation: access the same column as an attribute of the DataFrame.
# Only usable when the column name is a valid Python identifier that does
# not clash with an existing DataFrame attribute or method.
taxis.dropoff.head(3)

0    2019-03-23 20:27:24
1    2019-03-04 16:19:00
2    2019-03-27 18:00:25
Name: dropoff, dtype: object


# Indexing with a list of column names returns a DataFrame containing just
# those columns, in the order given in the list.
my_cols = ['fare', 'total', 'pickup_borough']
taxis[my_cols].head(3)


# The `columns` attribute holds the column labels as an Index.
taxis.columns

Index(['pickup', 'dropoff', 'fare', 'tip', 'tolls', 'total', 'color',
       'payment', 'pickup_borough', 'dropoff_borough'],
      dtype='object')


# Look up a column label by its zero-based position in `taxis.columns`,
# then use that label to select the column.
col7 = taxis.columns[7]
taxis[col7].head(3)

0    credit card
1           cash
2    credit card
Name: payment, dtype: object


# Slice the column labels by position (3, 4, 5 and 6; the end is exclusive)
# and select all of those columns at once.
cols = taxis.columns[3:7]
taxis[cols].head(3)


# loc[] is label-based: `:` keeps every row, the list names the columns.
my_cols = ['fare', 'total', 'pickup_borough']
taxis.loc[:, my_cols].head(3)


# iloc[] is position-based: `:` keeps every row, `3:7` takes the columns at
# positions 3 through 6 (the end of the slice is exclusive).
taxis.iloc[:, 3:7].head(3)


# For each column, report whether the value 7 occurs in it at least once;
# `.values` exposes the per-column flags as a plain boolean array.
taxis.eq(7).any().values

array([False, False,  True,  True, False,  True, False, False, False,
       False])


# Per-column flag: True where the column holds the value 7 at least once.
# Passing the flags to loc[] keeps only the flagged columns.
selection = taxis.eq(7).any()
taxis.loc[:, selection].head(3)


# Restrict the frame to its float64 columns, then keep only the columns that
# contain at least one value inside the closed range [10, 30].
taxis_sel = taxis.select_dtypes(include=['float64'])
# Both bounds must hold for the same cell, hence `&`. With `|` the test
# ("at least 10" or "at most 30") is true for every non-NaN number, so every
# column holding any number would be selected and the filter would do nothing.
selection = ((taxis_sel >= 10) & (taxis_sel <= 30)).any()
taxis_sel.loc[:, selection].head(3)


# `columns.isin()` yields one boolean per existing column, True when its
# label appears in `cols_list`. Names in the list that are not columns of
# the frame simply never match, so they are ignored rather than raising.
# Matching columns come back in the frame's own column order.
cols_list = ['pickup_borough', 'other_col_name', 'fare']
taxis.loc[:, taxis.columns.isin(cols_list)].head(3)


# Replace the default integer index with string labels of the form
# 'id_<n>' so the label-based (loc) and position-based (iloc) row lookups
# below are clearly distinguishable.
taxis = taxis.reset_index(level=0)  # old index becomes the 'index' column
taxis['index'] = 'id_' + taxis['index'].astype(str)
taxis = taxis.set_index('index', drop=True)
taxis.head(3)


# loc[] selects by index label: fetch the row labelled 'id_2' with all of
# its columns. A single label returns the row as a Series.
taxis.loc['id_2',:]

pickup             2019-03-27 17:53:01
dropoff            2019-03-27 18:00:25
fare                               7.5
tip                               2.36
tolls                              0.0
total                            14.16
color                           yellow
payment                    credit card
pickup_borough               Manhattan
dropoff_borough              Manhattan
Name: id_2, dtype: object


# A list of index labels returns a DataFrame with one row per label.
taxis.loc[['id_2', 'id_6'],:]


# iloc[] selects by zero-based position: fetch the third row (position 2)
# with all of its columns, regardless of what the index labels are.
taxis.iloc[2,:]

pickup             2019-03-27 17:53:01
dropoff            2019-03-27 18:00:25
fare                               7.5
tip                               2.36
tolls                              0.0
total                            14.16
color                           yellow
payment                    credit card
pickup_borough               Manhattan
dropoff_borough              Manhattan
Name: id_2, dtype: object


# A list of positions returns a DataFrame with the rows at those positions.
taxis.iloc[[2,6],:]


# Boolean Series marking the rows paid by credit card; handing it to loc[]
# keeps only the rows where the flag is True.
mask = taxis['payment'].eq('credit card')
taxis.loc[mask].head(3)


# Build each condition separately, then combine them element-wise with `&`
# so a row is kept only when both conditions hold.
paid_by_card = taxis['payment'] == 'credit card'
is_green = taxis['color'] == 'green'
mask = paid_by_card & is_green
taxis.loc[mask].head(3)


# Keep the rows whose pickup borough equals any of the listed values.
# No head() here: the full filtered frame is shown.
boroughs = ['Manhattan', 'Queens']
mask = taxis['pickup_borough'].isin(boroughs)
taxis.loc[mask]


# query() evaluates the string as a boolean expression in which bare names
# refer to columns; `|` is a logical "or", so this keeps the rows picked up
# in either Manhattan or Queens.
taxis.query("pickup_borough == 'Manhattan' | pickup_borough == 'Queens'")

Selecting Columns And Filtering Rows In Pandas

Selecting Columns¶

Selecting one column¶

Selecting multiple columns¶

Selecting columns using the columns attribute¶

Selecting columns using loc[]¶

Selecting columns using iloc[]¶

Selecting columns, by values in the columns, using any()¶

Selecting columns by column name using isin() and columns¶

Filtering rows¶

Selecting one row with loc¶

Selecting multiple rows with loc¶

Selecting one row with iloc¶

Selecting multiple rows with iloc¶

Selecting rows by the values in a column with one condition¶

Selecting rows by the values in a column with multiple conditions¶

Using isin, multiple values in one column¶

Selecting rows using query()¶

Conclusion¶

	pickup	dropoff	fare	tip	total	color	payment	pickup_borough	dropoff_borough
0	2019-03-23 20:21:09	2019-03-23 20:27:24	7.0	2.15	12.95	yellow	credit card	Manhattan	Manhattan
1	2019-03-04 16:11:55	2019-03-04 16:19:00	5.0	0.00	9.30	yellow	cash	Manhattan	Manhattan
2	2019-03-27 17:53:01	2019-03-27 18:00:25	7.5	2.36	14.16	yellow	credit card	Manhattan	Manhattan

	pickup	dropoff	fare	tip	tolls	total	color	payment	pickup_borough	dropoff_borough
index
id_0	2019-03-23 20:21:09	2019-03-23 20:27:24	7.0	2.15	0.0	12.95	yellow	credit card	Manhattan	Manhattan
id_1	2019-03-04 16:11:55	2019-03-04 16:19:00	5.0	0.00	0.0	9.30	yellow	cash	Manhattan	Manhattan
id_2	2019-03-27 17:53:01	2019-03-27 18:00:25	7.5	2.36	0.0	14.16	yellow	credit card	Manhattan	Manhattan

	pickup	dropoff	fare	tip	tolls	total	color	payment	pickup_borough	dropoff_borough
index
id_5452	2019-03-14 22:04:04	2019-03-14 22:10:00	5.50	0.0	0.00	6.80	green	credit card	Queens	Queens
id_5453	2019-03-29 18:12:27	2019-03-29 18:20:40	7.50	1.2	0.00	10.50	green	credit card	Manhattan	Manhattan
id_5456	2019-03-12 21:11:03	2019-03-12 21:41:36	42.82	0.0	5.76	49.08	green	credit card	Queens	Manhattan