Pandas: Adding and Deleting Columns, and Index Operations. This notebook shows how to add a column to, and delete a column from, a pandas DataFrame, and demonstrates various index operations using the pandas module.
In [1]:
import pandas as pd
In [2]:
# Build a single-column DataFrame holding the integers 0 through 9.
# No column names are supplied, so pandas labels the lone column 0.
data_list = list(range(10))
data_frame = pd.DataFrame(data_list)
data_frame
Out[2]:
| | 0 |
|---|---|
| 0 | 0 | 
| 1 | 1 | 
| 2 | 2 | 
| 3 | 3 | 
| 4 | 4 | 
| 5 | 5 | 
| 6 | 6 | 
| 7 | 7 | 
| 8 | 8 | 
| 9 | 9 | 
In [3]:
# Rename the single auto-numbered column (0) to 'rev' by assigning a new
# list of column labels; the list must have one entry per existing column.
data_frame.columns = ['rev']
data_frame
Out[3]:
| | rev |
|---|---|
| 0 | 0 | 
| 1 | 1 | 
| 2 | 2 | 
| 3 | 3 | 
| 4 | 4 | 
| 5 | 5 | 
| 6 | 6 | 
| 7 | 7 | 
| 8 | 8 | 
| 9 | 9 | 
In [4]:
# Assigning a scalar to a new column label creates the column and
# fills every row with that value.
data_frame['new_col'] = 5
data_frame
Out[4]:
| | rev | new_col |
|---|---|---|
| 0 | 0 | 5 | 
| 1 | 1 | 5 | 
| 2 | 2 | 5 | 
| 3 | 3 | 5 | 
| 4 | 4 | 5 | 
| 5 | 5 | 5 | 
| 6 | 6 | 5 | 
| 7 | 7 | 5 | 
| 8 | 8 | 5 | 
| 9 | 9 | 5 | 
In [5]:
# Add one to every value of 'new_col' (applied to the whole column at once).
data_frame['new_col'] += 1
data_frame
Out[5]:
| | rev | new_col |
|---|---|---|
| 0 | 0 | 6 | 
| 1 | 1 | 6 | 
| 2 | 2 | 6 | 
| 3 | 3 | 6 | 
| 4 | 4 | 6 | 
| 5 | 5 | 6 | 
| 6 | 6 | 6 | 
| 7 | 7 | 6 | 
| 8 | 8 | 6 | 
| 9 | 9 | 6 | 
In [6]:
# `del` removes the 'new_col' column from data_frame itself.
del data_frame['new_col']
data_frame
Out[6]:
| | rev |
|---|---|
| 0 | 0 | 
| 1 | 1 | 
| 2 | 2 | 
| 3 | 3 | 
| 4 | 4 | 
| 5 | 5 | 
| 6 | 6 | 
| 7 | 7 | 
| 8 | 8 | 
| 9 | 9 | 
In [7]:
# Add a constant-valued column, then a column populated from the values of
# the existing 'rev' column. New columns are appended in assignment order.
data_frame['test_col'] = 3
data_frame['another_col'] = data_frame['rev']
data_frame
Out[7]:
| | rev | test_col | another_col |
|---|---|---|---|
| 0 | 0 | 3 | 0 | 
| 1 | 1 | 3 | 1 | 
| 2 | 2 | 3 | 2 | 
| 3 | 3 | 3 | 3 | 
| 4 | 4 | 3 | 4 | 
| 5 | 5 | 3 | 5 | 
| 6 | 6 | 3 | 6 | 
| 7 | 7 | 3 | 7 | 
| 8 | 8 | 3 | 8 | 
| 9 | 9 | 3 | 9 | 
In [8]:
# Replace the default integer row labels with the letters 'a' through 'j'
# (one label per row).
index = list('abcdefghij')
data_frame.index = index
data_frame
Out[8]:
| | rev | test_col | another_col |
|---|---|---|---|
| a | 0 | 3 | 0 | 
| b | 1 | 3 | 1 | 
| c | 2 | 3 | 2 | 
| d | 3 | 3 | 3 | 
| e | 4 | 3 | 4 | 
| f | 5 | 3 | 5 | 
| g | 6 | 3 | 6 | 
| h | 7 | 3 | 7 | 
| i | 8 | 3 | 8 | 
| j | 9 | 3 | 9 | 
In [9]:
# .loc selects by index label; a single label returns that row as a Series
# whose entries are keyed by the column names.
data_frame.loc['a']
Out[9]:
rev            0
test_col       3
another_col    0
Name: a, dtype: int64
In [10]:
# Label-based slices with .loc include BOTH endpoints, so rows 'a' through
# 'd' (four rows) are returned.
data_frame.loc['a':'d']
Out[10]:
| | rev | test_col | another_col |
|---|---|---|---|
| a | 0 | 3 | 0 | 
| b | 1 | 3 | 1 | 
| c | 2 | 3 | 2 | 
| d | 3 | 3 | 3 | 
In [11]:
# Position-based slice: the stop position is excluded, so this returns the
# first four rows (positions 0, 1, 2 and 3).
data_frame.iloc[:4]
Out[11]:
| | rev | test_col | another_col |
|---|---|---|---|
| a | 0 | 3 | 0 | 
| b | 1 | 3 | 1 | 
| c | 2 | 3 | 2 | 
| d | 3 | 3 | 3 | 
In [12]:
# Indexing with a single column label returns that column as a Series.
data_frame['rev']
Out[12]:
a    0
b    1
c    2
d    3
e    4
f    5
g    6
h    7
i    8
j    9
Name: rev, dtype: int64
In [13]:
# Indexing with a list of column labels returns a DataFrame containing
# just those columns, in the order listed.
data_frame[['rev', 'test_col']]
Out[13]:
| | rev | test_col |
|---|---|---|
| a | 0 | 3 | 
| b | 1 | 3 | 
| c | 2 | 3 | 
| d | 3 | 3 | 
| e | 4 | 3 | 
| f | 5 | 3 | 
| g | 6 | 3 | 
| h | 7 | 3 | 
| i | 8 | 3 | 
| j | 9 | 3 | 
In [14]:
# Take the first three index labels by position, then use .loc to pull
# only the 'rev' column for those rows (result is a Series).
data_frame.loc[data_frame.index[:3], 'rev']
Out[14]:
a    0
b    1
c    2
Name: rev, dtype: int64
In [15]:
# Same row selection as a positional slice of the index, but with a list of
# column labels, so the result is a DataFrame rather than a Series.
data_frame.loc[data_frame.index[:3], ['rev', 'test_col']]
Out[15]:
| | rev | test_col |
|---|---|---|
| a | 0 | 3 | 
| b | 1 | 3 | 
| c | 2 | 3 | 
In [16]:
# Select 'another_col' for every row from position 5 to the end.
data_frame.loc[data_frame.index[5:], 'another_col']
Out[16]:
f    5
g    6
h    7
i    8
j    9
Name: another_col, dtype: int64
In [17]:
# The column list controls the output order: 'another_col' is shown before
# 'test_col' even though it was added to the frame later.
data_frame.loc[data_frame.index[:3], ['another_col', 'test_col']]
Out[17]:
| | another_col | test_col |
|---|---|---|
| a | 0 | 3 | 
| b | 1 | 3 | 
| c | 2 | 3 | 
In [18]:
# head(n) returns the first n rows of the DataFrame.
n = 5
data_frame.head(n)
Out[18]:
| | rev | test_col | another_col |
|---|---|---|---|
| a | 0 | 3 | 0 | 
| b | 1 | 3 | 1 | 
| c | 2 | 3 | 2 | 
| d | 3 | 3 | 3 | 
| e | 4 | 3 | 4 | 
In [19]:
# tail(n) returns the last n rows of the DataFrame. Pass the variable n
# rather than repeating the literal, so the row count is set in one place.
n = 5
data_frame.tail(n)
Out[19]:
| | rev | test_col | another_col |
|---|---|---|---|
| f | 5 | 3 | 5 | 
| g | 6 | 3 | 6 | 
| h | 7 | 3 | 7 | 
| i | 8 | 3 | 8 | 
| j | 9 | 3 | 9 |