Pandas
data:image/s3,"s3://crabby-images/4cdb8/4cdb8e6faecc84cfced5cf00f8260d6db4a5bf75" alt="DataFrame in Pandas DataFrame in Pandas"
DataFrame in Pandas
A data frame is a two-dimensional tabular labeled data structure with columns of potentially different types. A data frame can be created from numerous data collections such as the following:
- A 1D ndarray, list, dict, or series
- 2D Numpy ndarray
- Structured or record ndarray
- A series
- Another data frame
A data frame has arguments, which are an index (row labels) and columns (column labels).
Creating Dataframe from dictionary of series
#import necessary library
import pandas as pd
#First Series
Maths = pd.Series([10,20,30,40,50],index=['Arima','Pluto','Neptune','Zahir','Javed'])
#Second Series
Japanese = pd.Series([20,50,80,12],index=['Arima','Pluto','Zahir','Javed'])
#Dictionary of Series
Marks = {'Maths':Maths,'Japanese':Japanese}
#Dataframe from series
df = pd.DataFrame(Marks)
#Printing Dataframe
df
data:image/s3,"s3://crabby-images/cd847/cd84740d5b29bb5beb770a37d03b9ac43df73f42" alt=""
#Set index for the DataFrame
pd.DataFrame(Marks,index=['Javed','Arima','Pluto'])
data:image/s3,"s3://crabby-images/691d8/691d8ddeb906040440f6bd28cc0bb65f6f06e03f" alt=""
#Control the labels appearence of the DataFrame
pd.DataFrame(Marks,index=['Javed','Arima','Pluto'],columns=['Japanese','Maths'])
data:image/s3,"s3://crabby-images/fad4d/fad4d700b0ac0e985713faffe7405ff96399a6ac" alt=""
Creating DataFrames from a Dict of Ndarrays/Lists
#Without index
ndarrdict = {'One':[1,2,3,4],'Two':[2,4,6,8],'Three':[3,6,9,12]}
pd.DataFrame(ndarrdict)
data:image/s3,"s3://crabby-images/9ed98/9ed983a11f7eba4b67aabf704d9726a0cd94eae0" alt=""
#Assign index
pd.DataFrame(ndarrdict,index=['a','b','c','e'])
data:image/s3,"s3://crabby-images/37379/373791a61fb0297b0c6e175bd388b38839193fd5" alt=""
Creating Data Frames from a Structured or Record Array
import pandas as pd
import numpy as np
#creates a data frame by first specifying the data types of each
#column and then the values of each row. ('A', 'i4') determines the
#column label and its data type as integers, ('B', 'f4') determines the
#label as B and the data type as float, and finally ('C', 'a10') assigns the
#label C and data type as a string with a maximum of ten characters.
data = np.zeros((2,),dtype=[('A','i4'),
('B','f4'),
('C','a10')])
data[:] = [(1,2.,'Hello'),(2,3.3,'World')]
pd.DataFrame(data)
data:image/s3,"s3://crabby-images/88e7b/88e7b00abeda04aaf6d75111fc112cc99334a0cf" alt=""
pd.DataFrame(data, index=['First', 'Second'])
data:image/s3,"s3://crabby-images/00fb2/00fb26b8ec00361abba25e1daee52122c3b3da75" alt=""
pd.DataFrame(data, columns=['C', 'A', 'B'])
data:image/s3,"s3://crabby-images/9ffc4/9ffc4da038486be4894604198a6e69bc224974da" alt=""
Creating Data Frames from a List of Dictionaries
data2 = [{'A': 1, 'B': 2,'C':50}, {'A': 5, 'B': 10, 'C': 20}]
pd.DataFrame(data2)
data:image/s3,"s3://crabby-images/16f04/16f04e3d1df19ea97ddc9028feac4060ff4716a6" alt=""
pd.DataFrame(data2, index=['First', 'Second'])
data:image/s3,"s3://crabby-images/5c6f1/5c6f1806aa57f5e4dfaf0d0823f5f1100b0aa600" alt=""
pd.DataFrame(data2, columns=['A', 'B'])
data:image/s3,"s3://crabby-images/623d4/623d45b1af5a6e3cac91af239ca3059df8e23a99" alt=""
pd.DataFrame(data2, columns=['C', 'B'])
data:image/s3,"s3://crabby-images/ebb98/ebb98eab08c212815aa09923288e66743c85d5a0" alt=""
Creating Data Frames from a Dict of Tuples
dictionary = {'Maths':(1,2,3,5),'Japanese':(55,22,66,99),'Virology':(98,56,23,78)}
pd.DataFrame(dictionary)
data:image/s3,"s3://crabby-images/46028/4602887d5524b8ab5eae99006a7c0aab9e887073" alt=""
pd.DataFrame(dictionary,index=['Roll_1','Roll_2','Roll_3','Roll_4'])
data:image/s3,"s3://crabby-images/adf7e/adf7ec0c7ff6feedbd1dab0fd9303623f41e96c7" alt=""
Creating DataFrame from list of tuples
marks = [(1,2,3,5),(55,22,66,99),(98,56,23,78)]
pd.DataFrame(marks)
data:image/s3,"s3://crabby-images/4d5a2/4d5a25937ab97d62b73cbd75c60ef840f4b7b125" alt=""
pd.DataFrame(marks,columns=['A', 'B', 'C','D'])
data:image/s3,"s3://crabby-images/4f61d/4f61d442e8d214bf3647b7842ce06db64798d19d" alt=""
pd.DataFrame(marks,columns=['A', 'B', 'C','D'],index=['AA','BB','CC'])
data:image/s3,"s3://crabby-images/8fa40/8fa40be05fd81338b4fc993f213324e3a07c0e3f" alt=""
Selecting, Adding, and Deleting Data Frame Columns
expense = {'Food':[50,20,63,98],'Travel':[55,98,78,45]}
df = pd.DataFrame(expense)
df
data:image/s3,"s3://crabby-images/45b71/45b71da38d28079b26a941db097ce6471f5988c0" alt=""
df['Total'] = df['Food']+df['Travel']
df
data:image/s3,"s3://crabby-images/eaf04/eaf04eb3ae65ac85df104052be50d04b4a5dddf8" alt=""
#using condition
df['Flag'] = df['Total'] > 110
df
data:image/s3,"s3://crabby-images/c1fff/c1fff41a2ec88d5316ac2dc7dcc8df8ace681a40" alt=""
#Adding a Column Using a Scalar and Assigning to a Data Frame
df['Filler'] = 'HCT'
df['Slic'] = df['Food'][:2]
df
data:image/s3,"s3://crabby-images/43252/4325207ebccf2f77a32752b4a174475fe788cb72" alt=""
#Delete Columns
del df['Filler']
df
data:image/s3,"s3://crabby-images/1e904/1e904794495b108da4947e4c386f3402b507d4d3" alt=""
Flag = df.pop('Flag')
df
data:image/s3,"s3://crabby-images/94114/941142699849d37ec6296cd6853e3240aed474b6" alt=""
df.insert(0,'Education',[52,26,89,74])
df
data:image/s3,"s3://crabby-images/10107/101079c41f92fd0d9b05d27aede8fefc12d22c95" alt=""
#Assigning New Columns in Method Chains
df = pd.DataFrame({'Maths':[1,25,56],'Japanese':[88,96,54]})
df = df.assign(Total=lambda x : x['Maths']+x['Japanese'])
df = df.assign(Flaf = lambda x:x['Maths']>x['Japanese'])
df
data:image/s3,"s3://crabby-images/08720/08720dcf1824e078fecf1e38ffcbdcceb14da5bc" alt=""
df = df.assign(Sq = lambda x:x['Maths']*2)
df
data:image/s3,"s3://crabby-images/4b930/4b9304befd09db206025a83b27d1a54a41923584" alt=""
Indexing and Selecting Data Frames
df = pd.DataFrame({'Maths':[1,25,56],'Japanese':[88,96,54],
'Music':[1,15,89],'Virology':[89,57,56]})
df
data:image/s3,"s3://crabby-images/8f828/8f828a10860d990540996e20bb21f9ada2348109" alt=""
df['Maths']
data:image/s3,"s3://crabby-images/660f8/660f8ac000046a44c12f47dbed2f3445b2053927" alt=""
df.iloc[2]
data:image/s3,"s3://crabby-images/a877d/a877da7870e03f8f1243a5f7ad92731402d2908a" alt=""
df[1:]
data:image/s3,"s3://crabby-images/0a371/0a37164f3395a4b183e6271906bfbef8c9d58584" alt=""
df[df['Maths']>10]
data:image/s3,"s3://crabby-images/12f65/12f65f36c36fcc0e48d8a3a8a71da070edea64a0" alt=""
#Operation on Dataframes
df1 = pd.DataFrame({"A":[1,2,3],"B":[4,7,8],"C":[9,5,8]})
df2 = pd.DataFrame({"A":[111,2,33],"B":[46,7,68],"C":[69,5,98]})
df1
data:image/s3,"s3://crabby-images/4f694/4f6940f981aa385cf7802dadd41bba9c7006ad3a" alt=""
df2
data:image/s3,"s3://crabby-images/49b3d/49b3dfd4c00a5ada37028230143ad016f2eba8a9" alt=""
df1+df2
data:image/s3,"s3://crabby-images/54939/54939b2d8d5feaf69598099574f91d17cb203be3" alt=""
df1-df2
data:image/s3,"s3://crabby-images/954c7/954c76a8041721ca51ab961501f246bd940d8df2" alt=""
df2-df1.iloc[1]
data:image/s3,"s3://crabby-images/371ca/371ca329bb8e21a89eb081aaf0404b6eac6cc36b" alt=""
df2*2+1
data:image/s3,"s3://crabby-images/2cda7/2cda7746d6af4dabaed0406a5055fac2848e5aae" alt=""
Transposing a DataFrame
df = pd.DataFrame({'Maths':[1,25,56],'Japanese':[88,96,54],
'Music':[1,15,89],'Virology':[89,57,56]})
df
data:image/s3,"s3://crabby-images/7a424/7a4244c1ab50c51592c054ce83b065520f0ddb43" alt=""
df.T
data:image/s3,"s3://crabby-images/60d84/60d848c1cc9b8e49590381c9f9ff74b4637b4c60" alt=""
DataFrame interoperability with numpy functions
import pandas as pd
import numpy as np
df = pd.DataFrame({'Maths':[1,25,56],'Japanese':[88,96,54],
'Music':[1,15,89],'Virology':[89,57,56]})
df.T.dot(df)
data:image/s3,"s3://crabby-images/fd946/fd9460dbdbcddd012eb971103b3b1c5244fa5958" alt=""
ponru
0