0% found this document useful (0 votes)

141 views4 pages

Pandas

This document walks through common pandas operations: creating and manipulating Series and DataFrames; reading and writing CSV files; indexing and selecting data; cleaning and aggregating data; and merging DataFrames and appending Series to DataFrames.

Uploaded by

dashsidd1

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

0% found this document useful (0 votes)

141 views4 pages

Pandas

Uploaded by

dashsidd1

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT or PDF, or read online on Scribd

You are on page 1/ 4

Pandas

1. Pandas Data Structures - Hands-on

import pandas as pd
import numpy as np

# Exercise 1: build Series and DataFrames for two classes of five students.
# Class A uses fixed measurements; class B uses seeded random draws.
student_ids = ['s1', 's2', 's3', 's4', 's5']

# --- Class A -----------------------------------------------------------
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4], index=student_ids)
print(heights_A.shape)

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9], index=student_ids)
print(weights_A.dtype)

# Start from an empty frame and attach one column per Series.
df_A = pd.DataFrame().assign(
    Student_height=heights_A,
    Student_weight=weights_A,
)
print(df_A.shape)

# --- Class B -----------------------------------------------------------
# The generator is re-seeded with 100 before each draw, so x and y are
# produced from the same underlying sequence of random numbers.
np.random.seed(100)
x = np.random.normal(170.0, 25.0, 5)
heights_B = pd.Series(x, index=student_ids)

np.random.seed(100)
y = np.random.normal(75.0, 12.0, 5)
weights_B = pd.Series(y, index=student_ids)

print(heights_B.mean())

columns_B = {'Student_height': heights_B, 'Student_weight': weights_B}
df_B = pd.DataFrame(columns_B, index=weights_B.index)
print(df_B.columns)

2. Working with CSVs

import pandas as pd
import numpy as np
import os

# Exercise 2: write the class A / class B tables to CSV and read them back
# with different read_csv options.


def _show_file(path):
    """Print the raw text of the file at *path* to stdout.

    Done in Python rather than by shelling out to ``cat`` so the script also
    runs where ``cat`` is unavailable, and so the file contents appear in
    order with the surrounding ``print`` output when stdout is redirected.
    """
    with open(path) as handle:
        # The file already ends with a newline; do not add another one.
        print(handle.read(), end='')


student_ids = ['s1', 's2', 's3', 's4', 's5']

# --- Class A -----------------------------------------------------------
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4], index=student_ids)
print(heights_A.shape)
weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9], index=student_ids)
print(weights_A.dtype)

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A

# The index is written as an unnamed first column of classA.csv.
df_A.to_csv('classA.csv')
_show_file('classA.csv')

# Default read: the saved index comes back as an ordinary data column.
df_A2 = pd.read_csv('classA.csv')
print(df_A2)

# index_col=0: the first column is restored as the index.
df_A3 = pd.read_csv('classA.csv', index_col=0)
print(df_A3)

# --- Class B -----------------------------------------------------------
# The generator is re-seeded with 100 before each draw, so x and y are
# produced from the same underlying sequence of random numbers.
np.random.seed(100)
x = np.random.normal(loc=170.0, scale=25.0, size=5)
heights_B = pd.Series(x, index=student_ids)
np.random.seed(100)
y = np.random.normal(loc=75.0, scale=12.0, size=5)
weights_B = pd.Series(y, index=student_ids)
df_B = pd.DataFrame(
    {'Student_height': heights_B, 'Student_weight': weights_B},
    index=weights_B.index,
)

# index=False: the student ids are NOT written to classB.csv.
df_B.to_csv('classB.csv', index=False)
_show_file('classB.csv')

# Default read: first line is used as the header.
df_B2 = pd.read_csv('classB.csv')
print(df_B2)

# header=None: the header line is read as the first data row.
df_B3 = pd.read_csv('classB.csv', header=None)
print(df_B3)

# header=None, skiprows=2: drops the header line and the first data row.
df_B4 = pd.read_csv('classB.csv', header=None, skiprows=2)
print(df_B4)

3. Hands-on with Indexes

import pandas as pd

# Exercise 3: a daily DatetimeIndex, a membership test against it, and a
# two-level MultiIndex.

# One entry per day from 1 Sep 2017 through 15 Sep 2017 (both ends included).
dates = pd.date_range('2017/09/01', '2017/09/15')
print(dates[2])

# Parse two date strings and check which of them occur in `dates`.
datelist = ['14-Sep-2017', '9-Sep-2017']
dates_to_be_searched = pd.to_datetime(datelist)
print(dates_to_be_searched)
found_mask = dates_to_be_searched.isin(dates)
print(found_mask)

# First level: class name repeated per student; second level: student ids
# repeated once per class.
class_labels = ['classA'] * 5 + ['classB'] * 5
student_labels = ['s1', 's2', 's3', 's4', 's5'] * 2
arraylist = [class_labels, student_labels]

mi_index = pd.MultiIndex.from_arrays(arraylist)
print(mi_index.levels)

4. Access Elements in Data Structures

#Write your code here

import pandas as pd
import numpy as np

# Exercise 4: positional and label-based selection from a Series and a
# DataFrame.
student_ids = ['s1', 's2', 's3', 's4', 's5']

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4], index=student_ids)

# The Series is labelled with strings, so integer positions must go through
# .iloc. Plain heights_A[1] relies on a positional fallback that pandas has
# deprecated for non-integer indexes.
second_height = heights_A.iloc[1]
print(second_height)
middle_heights = heights_A.iloc[[1, 2, 3]]
print(middle_heights)

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9], index=student_ids)

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A

# Selecting a single column yields a Series.
height = df_A['Student_height']
print(type(height))

# Rows by position: first two students.
df_s1s2 = df_A.iloc[[0, 1]]
print(df_s1s2)

# Rows by position, in the requested order s2, s5, s1.
df_s2s5s1 = df_A.iloc[[1, 4, 0]]
print(df_s2s5s1)

# Rows whose label ends in '1' or '4', selected with a boolean mask.
df_s1s4 = df_A.loc[(df_A.index.str.endswith('1') | df_A.index.str.endswith('4'))]
print(df_s1s4)

5. Data Cleaning - Handson

#Write your code here

import pandas as pd
import numpy as np

# Exercise 5: introduce missing values, then drop every row that has any.
student_ids = ['s1', 's2', 's3', 's4', 's5']

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4], index=student_ids)
weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9], index=student_ids)

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A

# Blank out the whole s3 row.
df_A.loc['s3'] = np.nan

# Blank out only the second column (Student_weight) of row s5.
# This must be a single .loc[row, column] assignment: the chained form
# df_A.loc['s5'][1] = ... writes to a temporary row object and is not
# guaranteed to reach df_A (it never does under copy-on-write).
df_A.loc['s5', 'Student_weight'] = np.nan

# how='any': a row is removed as soon as one of its values is missing.
df_A2 = df_A.dropna(how='any')

print(df_A2)

6. Data Aggregation - Handson

import pandas as pd
import numpy as np

# Exercise 6: boolean filtering, index-based filtering, and a group-wise mean.
student_ids = ['s1', 's2', 's3', 's4', 's5']

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4], index=student_ids)
weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9], index=student_ids)

df_A = pd.DataFrame().assign(
    Student_height=heights_A,
    Student_weight=weights_A,
)

# Students taller than 160.0 AND lighter than 80.0.
is_tall = df_A['Student_height'] > 160.0
is_light = df_A['Student_weight'] < 80.0
df_A_filter1 = df_A[is_tall & is_light]
print(df_A_filter1)

# Rows whose index label is in the given list (only 's5' here).
wanted_ids = ['s5']
df_A_filter2 = df_A[df_A.index.isin(wanted_ids)]
print(df_A_filter2)

# The gender column is added after the filters above were taken, so the
# filtered frames do not contain it.
df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

# Mean height and weight per gender.
df_groups = df_A.groupby('Gender')
print(df_groups.mean())

import pandas as pd
import numpy as np

# Exercise 7: join a master table of people with a table of purchases.

# Ten people with ids 101..110 and names person1..person10.
nameid = pd.Series(range(101, 111))
name = pd.Series([f'person{number}' for number in range(1, 11)])

master = pd.DataFrame().assign(nameid=nameid, name=name)

# Purchases: three by id 108 and one by id 103.
purchases = {
    'nameid': [108, 108, 108, 103],
    'product': ['iPhone', 'Nokia', 'Micromax', 'Vivo'],
}
transaction = pd.DataFrame(purchases)

# Default (inner) join on the shared 'nameid' column: only people that
# appear in both tables are kept.
mdf = master.merge(transaction, on='nameid')
print(mdf)

8.
#Write your code here
import pandas as pd
import numpy as np

# Exercise 8: add one student to class A as a new row, then stack class B
# underneath to get a single table.
student_ids = ['s1', 's2', 's3', 's4', 's5']

# --- Class A -----------------------------------------------------------
heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4], index=student_ids)
weights_A = pd.Series([85.1, 90.2, 76.8, 80.4, 78.9], index=student_ids)

df_A = pd.DataFrame()
df_A['Student_height'] = heights_A
df_A['Student_weight'] = weights_A
df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

# New student s6: the Series name becomes the row label, its index the columns.
s = pd.Series(
    [165.4, 82.7, 'F'],
    index=['Student_height', 'Student_weight', 'Gender'],
    name='s6',
)

# DataFrame.append was removed in pandas 2.0, so the Series is turned into a
# one-row frame and concatenated instead. infer_objects() restores numeric
# dtypes on that row (the mixed-type Series is object-typed), which keeps the
# height/weight columns of the result as floats.
new_row = s.to_frame().T.infer_objects()
df_AA = pd.concat([df_A, new_row])
print(df_AA)

# --- Class B -----------------------------------------------------------
# The generator is re-seeded with 100 before each draw, so x and y are
# produced from the same underlying sequence of random numbers.
np.random.seed(100)
x = np.random.normal(loc=170.0, scale=25.0, size=5)
heights_B = pd.Series(x, index=student_ids)
np.random.seed(100)
y = np.random.normal(loc=75.0, scale=12.0, size=5)
weights_B = pd.Series(y, index=student_ids)
df_B = pd.DataFrame(
    {'Student_height': heights_B, 'Student_weight': weights_B},
    index=weights_B.index,
)

# Relabel class B so its rows continue after s6 instead of clashing with
# class A's s1..s5.
df_B.index = ['s7', 's8', 's9', 's10', 's11']
df_B['Gender'] = ['F', 'M', 'F', 'F', 'M']

# Stack both classes row-wise.
df = pd.concat([df_AA, df_B])
print(df)

NumPy, Pandas, MatplotLib, Seaborn, ScikitLearn (SkLearn)
No ratings yet
NumPy, Pandas, MatplotLib, Seaborn, ScikitLearn (SkLearn)
14 pages
Data Visualization Using Matplotlib in Python
No ratings yet
Data Visualization Using Matplotlib in Python
15 pages
Data Mining Using Phyton
No ratings yet
Data Mining Using Phyton
50 pages
Pandas
No ratings yet
Pandas
27 pages
Unit-1 Python Pandas
No ratings yet
Unit-1 Python Pandas
56 pages
Python Libraries
No ratings yet
Python Libraries
17 pages
ARIS PPM System Architecture
100% (1)
ARIS PPM System Architecture
84 pages
Python For Non-Programmers Final
No ratings yet
Python For Non-Programmers Final
218 pages
Unit 5
No ratings yet
Unit 5
27 pages
Jupyter
No ratings yet
Jupyter
17 pages
Python Pandas
100% (1)
Python Pandas
35 pages
Pandas
No ratings yet
Pandas
8 pages
Pandas
No ratings yet
Pandas
14 pages
Python Pandas Handson
No ratings yet
Python Pandas Handson
6 pages
Pandas DataFrame Cheat Sheet
No ratings yet
Pandas DataFrame Cheat Sheet
6 pages
Creating Dataframes Reshaping Data
100% (1)
Creating Dataframes Reshaping Data
2 pages
5 An Hour Betfair Money Machine
75% (4)
5 An Hour Betfair Money Machine
3 pages
Fds Unit - III
No ratings yet
Fds Unit - III
58 pages
Rapids Cheatsheet
100% (1)
Rapids Cheatsheet
2 pages
A Linguagem Da Paz Num Mundo de Conflitos
No ratings yet
A Linguagem Da Paz Num Mundo de Conflitos
181 pages
Python Pandas
No ratings yet
Python Pandas
6 pages
Spectrum Release Notes
No ratings yet
Spectrum Release Notes
11 pages
Predicting Salary with Experience
100% (1)
Predicting Salary with Experience
7 pages
Python Data Analysis Basics
No ratings yet
Python Data Analysis Basics
246 pages
Pandas Course Slides
No ratings yet
Pandas Course Slides
90 pages
Micro Project Report On: Airline Reservation System
100% (1)
Micro Project Report On: Airline Reservation System
17 pages
Python Cheat Sheet For Excel Users
No ratings yet
Python Cheat Sheet For Excel Users
5 pages
Specifications
No ratings yet
Specifications
58 pages
Gamification in Education
No ratings yet
Gamification in Education
8 pages
Pandas Cheat Sheet
No ratings yet
Pandas Cheat Sheet
2 pages
LMRS Ip 2020 21
No ratings yet
LMRS Ip 2020 21
21 pages
Data Analysis With Pandas - Introduction To Pandas Cheatsheet - Codecademy PDF
No ratings yet
Data Analysis With Pandas - Introduction To Pandas Cheatsheet - Codecademy PDF
3 pages
EDA Cheatsheet - Class Note
No ratings yet
EDA Cheatsheet - Class Note
29 pages
Numpy-User-1 10 1
No ratings yet
Numpy-User-1 10 1
107 pages
Automation For The Belt Conveyor System - Formatted Paper
No ratings yet
Automation For The Belt Conveyor System - Formatted Paper
6 pages
Incose SD Sept2019 Presentation Charley Patton Mbse A Practical Approach v01
No ratings yet
Incose SD Sept2019 Presentation Charley Patton Mbse A Practical Approach v01
20 pages
3.menus and Toolbars in WxPython
No ratings yet
3.menus and Toolbars in WxPython
13 pages
One That Follows AP (Availability, Partition)
No ratings yet
One That Follows AP (Availability, Partition)
2 pages
Unix Lab Manual
No ratings yet
Unix Lab Manual
56 pages
Microsoft Corporation's Organizational Culture & Its Characteristics
No ratings yet
Microsoft Corporation's Organizational Culture & Its Characteristics
2 pages
Python Notes For Beginners (Autosaved)
No ratings yet
Python Notes For Beginners (Autosaved)
52 pages
22am901 Data Science Using Python Unit 2
No ratings yet
22am901 Data Science Using Python Unit 2
116 pages
Class XII Data Handlinng Using PandasI
No ratings yet
Class XII Data Handlinng Using PandasI
46 pages
ALD Port Power Failure
No ratings yet
ALD Port Power Failure
1 page
Software Reuse for Developers
No ratings yet
Software Reuse for Developers
9 pages
Python Pandas Demo PDF
100% (2)
Python Pandas Demo PDF
23 pages
Assignment 61
100% (2)
Assignment 61
4 pages
Pandas Series and DataFrame Guide
No ratings yet
Pandas Series and DataFrame Guide
87 pages
Mat Plot Lib
No ratings yet
Mat Plot Lib
44 pages
Pandas
No ratings yet
Pandas
13 pages
Data Wrangling with Pandas
No ratings yet
Data Wrangling with Pandas
16 pages
5BH Ti
No ratings yet
5BH Ti
16 pages
Equip Sim User Manual
No ratings yet
Equip Sim User Manual
131 pages
Pandas 6 1716219621
No ratings yet
Pandas 6 1716219621
17 pages
Emu Log
No ratings yet
Emu Log
253 pages
Geeetech A20M 3D Printer Guide
No ratings yet
Geeetech A20M 3D Printer Guide
56 pages
MyWalboxApp QuickStartGuide EU
No ratings yet
MyWalboxApp QuickStartGuide EU
15 pages
ML Lab1 Python Panda
No ratings yet
ML Lab1 Python Panda
9 pages
Data Visualization and Matplot
No ratings yet
Data Visualization and Matplot
11 pages
Pandas in Python 16sept2022
No ratings yet
Pandas in Python 16sept2022
8 pages
Python Data Visualization Guide
No ratings yet
Python Data Visualization Guide
16 pages
Sax Phone
No ratings yet
Sax Phone
188 pages
Test Management Roles & Responsibilities
No ratings yet
Test Management Roles & Responsibilities
2 pages
Python 3 Beginner's Reference Cheat Sheet: by Via
100% (1)
Python 3 Beginner's Reference Cheat Sheet: by Via
1 page
Python & Pandas Coding Quiz
No ratings yet
Python & Pandas Coding Quiz
2 pages
Tools Machine Learning
No ratings yet
Tools Machine Learning
9 pages
Python - Programming
No ratings yet
Python - Programming
9 pages
Python Date Time
No ratings yet
Python Date Time
6 pages
Pandas vs PySpark: Data Operations
No ratings yet
Pandas vs PySpark: Data Operations
3 pages
Python Numpy (1) : Intro To Multi-Dimensional Array & Numerical Linear Algebra
100% (1)
Python Numpy (1) : Intro To Multi-Dimensional Array & Numerical Linear Algebra
27 pages
1 Pandas Basics
No ratings yet
1 Pandas Basics
13 pages
1 30PM Application of The Autonomous Ground Vehicle Reference Architecture in Model Based Systems Engineering
No ratings yet
1 30PM Application of The Autonomous Ground Vehicle Reference Architecture in Model Based Systems Engineering
12 pages
Assignment MET1233
No ratings yet
Assignment MET1233
12 pages
UCS310
No ratings yet
UCS310
2 pages
Python Basics: Subset Slice
No ratings yet
Python Basics: Subset Slice
1 page
GPT4All Technical Report 3
No ratings yet
GPT4All Technical Report 3
4 pages
New Microsoft Excel Worksheet (2) - 1
No ratings yet
New Microsoft Excel Worksheet (2) - 1
6 pages
Government Scheme Awareness App
No ratings yet
Government Scheme Awareness App
4 pages
International Indian School, Riyadh WORKSHEET (2020-2021) Grade - Xii - Informatics Practices - Second Term
No ratings yet
International Indian School, Riyadh WORKSHEET (2020-2021) Grade - Xii - Informatics Practices - Second Term
9 pages
Heni Kothari: Main Objective
No ratings yet
Heni Kothari: Main Objective
1 page
Smita Deore 1225548570
No ratings yet
Smita Deore 1225548570
2 pages
Research Paper Presentation Pandas Moshiul Arefin
No ratings yet
Research Paper Presentation Pandas Moshiul Arefin
30 pages
Python Notes
No ratings yet
Python Notes
110 pages
ETL Tester Skill Enhancement Guide
No ratings yet
ETL Tester Skill Enhancement Guide
1 page
Introduction To Tkinter
No ratings yet
Introduction To Tkinter
8 pages
Python Training Techavera
No ratings yet
Python Training Techavera
5 pages
Data Analytics With Python-1
No ratings yet
Data Analytics With Python-1
12 pages
Programming For Data Science With Python: Nanodegree Program Syllabus
No ratings yet
Programming For Data Science With Python: Nanodegree Program Syllabus
13 pages
SQL Database Notes
No ratings yet
SQL Database Notes
8 pages
12 Comp Sci 1 Revision Notes Pythan Advanced Prog
No ratings yet
12 Comp Sci 1 Revision Notes Pythan Advanced Prog
5 pages

Pandas

Uploaded by

Pandas

Uploaded by

Pandas

1. Pandas Data Structures - Hands-on

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

2. Working with CSVs

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

df_B4=pd.read_csv("classB.csv", header=None, skiprows=2)

3. Hands-on with Indexes

dates = pd.date_range(start= '2017/09/01', end='2017/09/15')

4. Access Elements in Data Structures

#Write your code here

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_s1s4 = df_A.loc[(df_A.index.str.endswith('1') | df_A.index.str.endswith('4'))]

5. Data Cleaning - Handson

#Write your code here

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_A2 = df_A.dropna(how ='any')

6. Data Aggregation - Handson

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_A_filter1 = df_A[(df_A.Student_height > 160.0) & (df_A.Student_weight < 80.0)]

df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

nameid = pd.Series(range(101, 111))

transaction = pd.DataFrame({'nameid':[108, 108, 108,103], 'product':['iPhone',

heights_A = pd.Series([176.2, 158.4, 167.6, 156.2, 161.4])

weights_A = pd.Series([85.1, 90.2, 76.8, 80.4 , 78.9])

df_A['Gender'] = ['M', 'F', 'M', 'M', 'F']

You might also like