0% found this document useful (0 votes)

128 views4 pages

Pandas

This document walks through hands-on pandas exercises: creating and manipulating Series and DataFrames, reading and writing CSV files, indexing and selecting data, cleaning and aggregating data, merging DataFrames, and appending a Series to a DataFrame.

Uploaded by

dashsidd1

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

128 views4 pages

Pandas

Uploaded by

dashsidd1

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 4

Pandas

1. Pandas Data Structures - Hands-on

import pandas as pd
import numpy as np

# Section 1: build Series and DataFrames for two classes of students and
# print a few of their basic attributes.
student_ids = ['s1', 's2', 's3', 's4', 's5']

# Class A: fixed measurements labelled by student id.
heights_A = pd.Series(
    [176.2, 158.4, 167.6, 156.2, 161.4],
    index=student_ids,
)
print(heights_A.shape)

weights_A = pd.Series(
    [85.1, 90.2, 76.8, 80.4, 78.9],
    index=student_ids,
)
print(weights_A.dtype)

# Start from an empty frame and attach one column per Series.
df_A = pd.DataFrame().assign(
    Student_height=heights_A,
    Student_weight=weights_A,
)
print(df_A.shape)

# Class B: normally distributed samples. The generator is reseeded with the
# same value before each draw, so both samples use the same random stream.
np.random.seed(100)
x = np.random.normal(loc=170.0, scale=25.0, size=5)
heights_B = pd.Series(x, index=student_ids)

np.random.seed(100)
y = np.random.normal(loc=75.0, scale=12.0, size=5)
weights_B = pd.Series(y, index=student_ids)
print(heights_B.mean())

class_b_columns = {
    'Student_height': heights_B,
    'Student_weight': weights_B,
}
df_B = pd.DataFrame(class_b_columns, index=weights_B.index)
print(df_B.columns)

2. Working with CSVs

import pandas as pd
import numpy as np
import os

# Section 2: write DataFrames to CSV files in the current directory and read
# them back with different `read_csv` options.
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])
heights_A.index = ['s1', 's2', 's3', 's4', 's5']
print(heights_A.shape)

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9])
weights_A.index = ['s1', 's2', 's3', 's4', 's5']
print(weights_A.dtype)

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A

# Class A is written with its index (the student ids) as the first column.
df_A.to_csv('classA.csv')
# Echo the file with Python I/O rather than shelling out to `cat`: that
# command does not exist on Windows, and a child process writes to stdout
# outside Python's buffering, so its output can appear out of order.
with open('classA.csv', encoding='utf-8') as csv_file:
    print(csv_file.read(), end='')

# Default read: the saved index comes back as an ordinary column.
df_A2 = pd.read_csv('classA.csv')
print(df_A2)

# index_col=0 uses the first CSV column as the index again.
df_A3 = pd.read_csv('classA.csv', index_col=0)
print(df_A3)

# Class B: the generator is reseeded with the same value before each draw,
# so both samples use the same random stream.
np.random.seed(100)
x = np.random.normal(loc=170.0, scale=25.0, size=5)
heights_B = pd.Series(x, index=['s1', 's2', 's3', 's4', 's5'])

np.random.seed(100)
y = np.random.normal(loc=75.0, scale=12.0, size=5)
weights_B = pd.Series(y, index=['s1', 's2', 's3', 's4', 's5'])

df_B = pd.DataFrame(
    {'Student_height': heights_B, 'Student_weight': weights_B},
    index=weights_B.index,
)

# Class B is written without its index, so the file holds only a header row
# and the data rows.
df_B.to_csv('classB.csv', index=False)
with open('classB.csv', encoding='utf-8') as csv_file:
    print(csv_file.read(), end='')

df_B2 = pd.read_csv('classB.csv')
print(df_B2)

# header=None treats the header line as a data row.
df_B3 = pd.read_csv('classB.csv', header=None)
print(df_B3)

# skiprows=2 additionally drops the first two lines of the file (the header
# line and the first data row).
df_B4 = pd.read_csv('classB.csv', header=None, skiprows=2)
print(df_B4)

3. Hands-on with Indexes

import pandas as pd

# Section 3: work with a DatetimeIndex and a two-level MultiIndex.

# Daily timestamps from 1 September 2017 through 15 September 2017.
dates = pd.date_range(
    start='2017/09/01',
    end='2017/09/15',
)
third_date = dates[2]
print(third_date)

# Parse two date strings and test which of them occur in `dates`.
datelist = ['14-Sep-2017', '9-Sep-2017']
dates_to_be_searched = pd.to_datetime(datelist)
print(dates_to_be_searched)
found_mask = dates_to_be_searched.isin(dates)
print(found_mask)

# Two parallel label arrays: the class name and the student id of each entry.
class_labels = ['classA'] * 5 + ['classB'] * 5
student_labels = ['s1', 's2', 's3', 's4', 's5'] * 2
arraylist = [class_labels, student_labels]

mi_index = pd.MultiIndex.from_arrays(arraylist)
print(mi_index.levels)

4. Access Elements in Data Structures

#Write your code here

import pandas as pd
import numpy as np

# Section 4: access elements of a Series and rows of a DataFrame by position
# and by label.
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])
heights_A.index = ['s1', 's2', 's3', 's4', 's5']

# The index holds string labels, so positional access must go through
# `.iloc`. Plain `heights_A[1]` relies on an integer-as-position fallback
# that pandas has deprecated.
print(heights_A.iloc[1])
print(heights_A.iloc[[1, 2, 3]])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9])
weights_A.index = ['s1', 's2', 's3', 's4', 's5']

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A

# Selecting a single column yields a Series.
height = df_A['Student_height']
print(type(height))

# Rows picked by position: the first two rows.
df_s1s2 = df_A.iloc[[0, 1]]
print(df_s1s2)

# Rows picked by position in a custom order (second, fifth, first).
df_s2s5s1 = df_A.iloc[[1, 4, 0]]
print(df_s2s5s1)

# Rows whose index label ends in '1' or '4', selected with a boolean mask.
df_s1s4 = df_A.loc[(df_A.index.str.endswith('1') | df_A.index.str.endswith('4'))]
print(df_s1s4)

5. Data Cleaning - Handson

#Write your code here

import pandas as pd
import numpy as np

# Section 5: introduce missing values into a DataFrame and drop the rows
# that contain them.
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])
heights_A.index = ['s1', 's2', 's3', 's4', 's5']

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9])
weights_A.index = ['s1', 's2', 's3', 's4', 's5']

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A

# Blank out the whole 's3' row.
df_A.loc['s3'] = np.nan

# Blank out only the weight of 's5'. A single `.loc[row, column]` assignment
# writes into df_A itself; the chained form `df_A.loc['s5'][1] = ...` may
# write into a temporary row object and leave df_A unchanged.
df_A.loc['s5', 'Student_weight'] = np.nan

# Keep only the rows with no missing value in any column.
df_A2 = df_A.dropna(how='any')
print(df_A2)

6. Data Aggregation - Handson

import pandas as pd
import numpy as np

# Section 6: filter rows with boolean masks and aggregate by group.
student_ids = ['s1', 's2', 's3', 's4', 's5']

heights_A = pd.Series(
    [176.2, 158.4, 167.6, 156.2, 161.4],
    index=student_ids,
)
weights_A = pd.Series(
    [85.1, 90.2, 76.8, 80.4, 78.9],
    index=student_ids,
)

# Start from an empty frame and attach one column per Series.
df_A = pd.DataFrame().assign(
    Student_height=heights_A,
    Student_weight=weights_A,
)

# Students taller than 160.0 and lighter than 80.0.
is_tall = df_A['Student_height'] > 160.0
is_light = df_A['Student_weight'] < 80.0
df_A_filter1 = df_A[is_tall & is_light]
print(df_A_filter1)

# Only the row labelled 's5'.
is_s5 = df_A.index.isin(['s5'])
df_A_filter2 = df_A[is_s5]
print(df_A_filter2)

# The Gender column is added after the filters, so the filtered frames
# above do not contain it.
df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

# Per-gender mean of the numeric columns.
df_groups = df_A.groupby('Gender')
group_means = df_groups.mean()
print(group_means)

import pandas as pd
import numpy as np

# Merge a master table of people with a table of their transactions.

# Master table: ids 101-110 paired with names person1-person10.
nameid = pd.Series(range(101, 111))
name = pd.Series([f'person{i}' for i in range(1, 11)])
master = pd.DataFrame().assign(nameid=nameid, name=name)

# Transactions: one row per purchased product, keyed by the buyer's id.
buyer_ids = [108, 108, 108, 103]
products = ['iPhone', 'Nokia', 'Micromax', 'Vivo']
transaction = pd.DataFrame({'nameid': buyer_ids, 'product': products})

# Join on the shared 'nameid' column using the default merge type.
mdf = master.merge(transaction, on='nameid')
print(mdf)

8.
#Write your code here
import pandas as pd
import numpy as np

# Section 8: add one student row to class A, then stack class A and class B
# into a single DataFrame.
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])
heights_A.index = ['s1', 's2', 's3', 's4', 's5']

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9])
weights_A.index = ['s1', 's2', 's3', 's4', 's5']

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A
df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

# A new student record; the Series name ('s6') becomes its row label.
s = pd.Series(
    [165.4, 82.7, 'F'],
    index=['Student_height', 'Student_weight', 'Gender'],
    name='s6',
)

# `DataFrame.append` was removed in pandas 2.0. Turn the record into a
# one-row frame and concatenate instead. `infer_objects()` restores numeric
# dtypes, because transposing a mixed-type Series yields object columns.
new_row = s.to_frame().T.infer_objects()
df_AA = pd.concat([df_A, new_row])
print(df_AA)

# Class B: the generator is reseeded with the same value before each draw,
# so both samples use the same random stream.
np.random.seed(100)
x = np.random.normal(loc=170.0, scale=25.0, size=5)
heights_B = pd.Series(x, index=['s1', 's2', 's3', 's4', 's5'])

np.random.seed(100)
y = np.random.normal(loc=75.0, scale=12.0, size=5)
weights_B = pd.Series(y, index=['s1', 's2', 's3', 's4', 's5'])

df_B = pd.DataFrame(
    {'Student_height': heights_B, 'Student_weight': weights_B},
    index=weights_B.index,
)
# Relabel class B so its ids continue after class A's s1-s6.
df_B.index = ['s7', 's8', 's9', 's10', 's11']
df_B['Gender'] = ['F', 'M', 'F', 'F', 'M']

# Stack both classes row-wise.
df = pd.concat([df_AA, df_B])
print(df)

Image Processing
No ratings yet
Image Processing
5 pages
NumPy Notes
No ratings yet
NumPy Notes
13 pages
Complete Python With NumPy & Pandas - Naresh-i-Technologies
No ratings yet
Complete Python With NumPy & Pandas - Naresh-i-Technologies
13 pages
HackerRank Python Practice Topics
0% (1)
HackerRank Python Practice Topics
14 pages
Pandas Cheat Sheet PDF
67% (3)
Pandas Cheat Sheet PDF
1 page
Assignment 61
100% (2)
Assignment 61
4 pages
Datascience With Answers
100% (1)
Datascience With Answers
36 pages
HVP 20 4 DA 281 GB Guner Abi
100% (2)
HVP 20 4 DA 281 GB Guner Abi
34 pages
Data Structures in Pandas Solution.: Code
No ratings yet
Data Structures in Pandas Solution.: Code
9 pages
Data Visualization and Matplot
No ratings yet
Data Visualization and Matplot
11 pages
International Indian School, Riyadh WORKSHEET (2020-2021) Grade - Xii - Informatics Practices - Second Term
No ratings yet
International Indian School, Riyadh WORKSHEET (2020-2021) Grade - Xii - Informatics Practices - Second Term
9 pages
Data Analysis With Pandas - Introduction To Pandas Cheatsheet - Codecademy PDF
No ratings yet
Data Analysis With Pandas - Introduction To Pandas Cheatsheet - Codecademy PDF
3 pages
Python Practice Exercise PDF
No ratings yet
Python Practice Exercise PDF
3 pages
Pandas Data Analysis Handbook
No ratings yet
Pandas Data Analysis Handbook
55 pages
Python Revision Tour
No ratings yet
Python Revision Tour
14 pages
Pandas Cheat Sheet
No ratings yet
Pandas Cheat Sheet
2 pages
Python Essentials
No ratings yet
Python Essentials
7 pages
Class XII Data Handlinng Using PandasI
No ratings yet
Class XII Data Handlinng Using PandasI
46 pages
Pandas Practice Questions
No ratings yet
Pandas Practice Questions
2 pages
Python Interview Questions: Answer: in Duck Typing, One Is Concerned With Just Those Aspects of An Object That Are
No ratings yet
Python Interview Questions: Answer: in Duck Typing, One Is Concerned With Just Those Aspects of An Object That Are
12 pages
Worksheet - Pandas
100% (1)
Worksheet - Pandas
16 pages
Top Pandas Functions
No ratings yet
Top Pandas Functions
19 pages
Pandas Complete Notes
No ratings yet
Pandas Complete Notes
105 pages
Python Pandas Demo PDF
100% (2)
Python Pandas Demo PDF
23 pages
DAX Cheat Sheet
No ratings yet
DAX Cheat Sheet
10 pages
Py Spark
No ratings yet
Py Spark
427 pages
Advanced Python
No ratings yet
Advanced Python
204 pages
Python Technical Interviews Questions
100% (1)
Python Technical Interviews Questions
15 pages
This Study Resource Was
No ratings yet
This Study Resource Was
5 pages
21 Machine Learning Using Scikit Learn Ipynb Colaboratory PDF
100% (1)
21 Machine Learning Using Scikit Learn Ipynb Colaboratory PDF
23 pages
Mat Plot Lib
No ratings yet
Mat Plot Lib
44 pages
AWK Command in Unix
No ratings yet
AWK Command in Unix
6 pages
Python Pandas Cheatsheety
No ratings yet
Python Pandas Cheatsheety
7 pages
Python Notes
No ratings yet
Python Notes
49 pages
Python
0% (1)
Python
67 pages
Untitled
100% (1)
Untitled
125 pages
Pandas: Import
100% (1)
Pandas: Import
13 pages
Data Visualization Python Tutorial
No ratings yet
Data Visualization Python Tutorial
9 pages
Pandas Cheat Sheet
No ratings yet
Pandas Cheat Sheet
2 pages
Pytest Documentation: Release 2.7.1
No ratings yet
Pytest Documentation: Release 2.7.1
219 pages
Association Rule Mining Lesson PDF
No ratings yet
Association Rule Mining Lesson PDF
9 pages
Unit 1 - Data Handling Using Pandas and Data Visualisation: Important Multiple Choice Questions
No ratings yet
Unit 1 - Data Handling Using Pandas and Data Visualisation: Important Multiple Choice Questions
6 pages
Pandas Guide
No ratings yet
Pandas Guide
64 pages
Python Date Time
No ratings yet
Python Date Time
6 pages
Python Final Print Vision 22
No ratings yet
Python Final Print Vision 22
112 pages
Data Visualization
No ratings yet
Data Visualization
9 pages
SQL Database Notes
No ratings yet
SQL Database Notes
8 pages
STAT 451: Intro To Machine Learning Lecture Notes
100% (1)
STAT 451: Intro To Machine Learning Lecture Notes
17 pages
Numpy Interview Questions: Click Here
No ratings yet
Numpy Interview Questions: Click Here
32 pages
Python Revision Material - CH.1,2.3.5.9
No ratings yet
Python Revision Material - CH.1,2.3.5.9
31 pages
Python Pandas
100% (1)
Python Pandas
35 pages
Strings PDF
No ratings yet
Strings PDF
14 pages
Structure Query Language (SQL)
No ratings yet
Structure Query Language (SQL)
112 pages
Day64 - Pandas Interview Questions
No ratings yet
Day64 - Pandas Interview Questions
5 pages
Pandas Dataframe
No ratings yet
Pandas Dataframe
48 pages
Python
No ratings yet
Python
35 pages
Introduction To Data Visualization in Python
No ratings yet
Introduction To Data Visualization in Python
16 pages
Python Practice Problems List
No ratings yet
Python Practice Problems List
4 pages
Python Interview Questions You'll Most Likely Be Asked
From Everand
Python Interview Questions You'll Most Likely Be Asked
Vibrant Publishers
2/5 (1)
Python Interview Questions
From Everand
Python Interview Questions
equitypress
4.5/5 (6)
Google Cloud Platform Complete Self-Assessment Guide
From Everand
Google Cloud Platform Complete Self-Assessment Guide
Gerardus Blokdyk
1/5 (1)
01 Cbs - Dec012016 (1) Features & Control
No ratings yet
01 Cbs - Dec012016 (1) Features & Control
72 pages
Lis-02-Three Months Rolling Programme
No ratings yet
Lis-02-Three Months Rolling Programme
9 pages
ML Project Report
No ratings yet
ML Project Report
16 pages
A User-Friendly Assessment Tool For Museum Storage
No ratings yet
A User-Friendly Assessment Tool For Museum Storage
11 pages
C# From A Java Developer's
No ratings yet
C# From A Java Developer's
83 pages
Audio Catalogue: We Supply Sound
No ratings yet
Audio Catalogue: We Supply Sound
64 pages
18 Series Rev C Installation and Operation PDF
No ratings yet
18 Series Rev C Installation and Operation PDF
256 pages
Entrepreneurship
No ratings yet
Entrepreneurship
12 pages
Final Internship Report Summer
0% (2)
Final Internship Report Summer
23 pages
MSME Notification_25032025_Highlighted
No ratings yet
MSME Notification_25032025_Highlighted
2 pages
Tenants Rights
No ratings yet
Tenants Rights
36 pages
Portable Turbidity Meter: Features
No ratings yet
Portable Turbidity Meter: Features
1 page
Servo Mr-E-A-Ag PDF
0% (1)
Servo Mr-E-A-Ag PDF
310 pages
Goel Institute of Technology & Management, Lucknow KMBHR04 - Strategic Human Resource Management 2 Sessional Exam - MCQ Time: 10:00am-1pm Marks: 60
No ratings yet
Goel Institute of Technology & Management, Lucknow KMBHR04 - Strategic Human Resource Management 2 Sessional Exam - MCQ Time: 10:00am-1pm Marks: 60
7 pages
Red Cross Youth: About RCY
No ratings yet
Red Cross Youth: About RCY
6 pages
Class Xii Maths Answer Key Setb
No ratings yet
Class Xii Maths Answer Key Setb
11 pages
Sufficiency Strategy
No ratings yet
Sufficiency Strategy
17 pages
NIT TPSODL - OT - 2023-24 - 012 - Survey, Collection & Disconnection Activities
No ratings yet
NIT TPSODL - OT - 2023-24 - 012 - Survey, Collection & Disconnection Activities
71 pages
NT2580, Week 1 Worksheet 1
No ratings yet
NT2580, Week 1 Worksheet 1
2 pages
Tugas 1 - Silicon-Nitride Ceramics
No ratings yet
Tugas 1 - Silicon-Nitride Ceramics
31 pages
Boy Scouts of The Phils Vs - Coa, GR 177131, June 7, 2011 DIGEST
No ratings yet
Boy Scouts of The Phils Vs - Coa, GR 177131, June 7, 2011 DIGEST
3 pages
Telecommande Temium F BW0392 Manual
0% (2)
Telecommande Temium F BW0392 Manual
34 pages
BNI - THE PSYCHOLOGY OF GIVERS GAIN' by Sudip Mukerjee
No ratings yet
BNI - THE PSYCHOLOGY OF GIVERS GAIN' by Sudip Mukerjee
2 pages
Perimeter Length: 560m: QTY Unit U-Cost Amount Description I. Preliminaries
No ratings yet
Perimeter Length: 560m: QTY Unit U-Cost Amount Description I. Preliminaries
1 page
Topic-: Social Cost Benefit Analysis, UNIDO Approach, Shadow Pricing
No ratings yet
Topic-: Social Cost Benefit Analysis, UNIDO Approach, Shadow Pricing
23 pages
Brochure PDF
No ratings yet
Brochure PDF
8 pages
Computer Accounting With Sage 50 Complete Accounting 2013 17th Edition Carol Yacht Solutions Manual
No ratings yet
Computer Accounting With Sage 50 Complete Accounting 2013 17th Edition Carol Yacht Solutions Manual
48 pages
SDS - EU - EN - Nitric Acid 65%
No ratings yet
SDS - EU - EN - Nitric Acid 65%
26 pages
"2020" Seminar Information: FORD 6R140W - 6R80
No ratings yet
"2020" Seminar Information: FORD 6R140W - 6R80
4 pages

Uploaded by

Uploaded by

Pandas

1. Pandas Data Structures - Hands-on

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

2. Working with CSVs

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

df_B4=pd.read_csv("classB.csv", header=None, skiprows=2)

3. Hands-on with Indexes

dates = pd.date_range(start= '2017/09/01', end='2017/09/15')

4. Access Elements in Data Structures

#Write your code here

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_s1s4 = df_A.loc[(df_A.index.str.endswith('1') | df_A.index.str.endswith('4'))]

5. Data Cleaning - Handson

#Write your code here

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_A2 = df_A.dropna(how ='any')

6. Data Aggregation - Handson

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_A_filter1 = df_A[(df_A.Student_height > 160.0) & (df_A.Student_weight < 80.0)]

df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

nameid = pd.Series(range(101, 111))

transaction = pd.DataFrame({'nameid':[108, 108, 108,103], 'product':['iPhone',

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

You might also like