import pandas as pd
# Build a Series from a plain Python list of mixed types. With no index given,
# pandas labels the entries 0..5, and the mixed values give dtype=object.
my_list = [7, 'Beijing', '19大', 3.1415, -10000, 'Happy']
s = pd.Series(data=my_list)
print(type(s))
print(s)
0 7
1 Beijing
2 19大
3 3.1415
4 -10000
5 Happy
dtype: object
# Same values, but with explicit string labels 'A'..'F' instead of the default
# integer index.
s = pd.Series(
    [7, 'Beijing', '19大', 3.1415, -10000, 'Happy'],
    index=list('ABCDEF'),
)
print(s)
A 7
B Beijing
C 19大
D 3.1415
E -10000
F Happy
dtype: object
# Build a named Series from a dict: keys become the index labels and the None
# value for 'Suzhou' is stored as NaN, which makes the whole Series float64.
cities = {
    'Beijing': 55000,
    'Shanghai': 60000,
    'shenzhen': 50000,
    'Hangzhou': 20000,
    'Guangzhou': 45000,
    'Suzhou': None,
}
apts = pd.Series(data=cities, name='income')
print(apts)
Beijing 55000.0
Guangzhou 45000.0
Hangzhou 20000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 50000.0
Name: income, dtype: float64
import numpy as np
# Wrap a NumPy array of five standard-normal samples in a Series labelled
# 'a'..'e'. The values differ on every run because no seed is set.
d = pd.Series(
    np.random.randn(5),
    index=list('abcde'),
)
print(d)
a -0.329401
b -0.435921
c -0.232267
d -0.846713
e -0.406585
dtype: float64
import pandas as pd
# Recreate the income Series used by the selection examples that follow.
cities = {
    'Beijing': 55000, 'Shanghai': 60000, 'shenzhen': 50000,
    'Hangzhou': 20000, 'Guangzhou': 45000, 'Suzhou': None,
}
apts = pd.Series(cities, name='income')
print(apts)
Beijing 55000.0
Guangzhou 45000.0
Hangzhou 20000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 50000.0
Name: income, dtype: float64
# Select the 4th entry by position. The index holds string labels, so a bare
# apts[3] depends on pandas' integer-as-position fallback, which is deprecated;
# .iloc states the positional intent explicitly.
print(apts.iloc[3])
60000.0
# Select several entries by position, in the order given. As with a single
# integer, a list of integers on a string-labelled Series needs .iloc rather
# than the deprecated positional fallback of plain [].
print(apts.iloc[[3, 4, 1]])
Shanghai 60000.0
Suzhou NaN
Guangzhou 45000.0
Name: income, dtype: float64
# Positional slice: everything except the first entry.
print(apts.iloc[1:])
Guangzhou 45000.0
Hangzhou 20000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 50000.0
Name: income, dtype: float64
# Positional slice: everything except the last two entries.
print(apts.iloc[:-2])
Beijing 55000.0
Guangzhou 45000.0
Hangzhou 20000.0
Shanghai 60000.0
Name: income, dtype: float64
# Adding two slices aligns them on index labels, not on position. A label
# present in only one slice (the first or last entry here) comes out as NaN,
# and so does any label whose value is already NaN.
print(apts.iloc[1:] + apts.iloc[:-1])
Beijing NaN
Guangzhou 90000.0
Hangzhou 40000.0
Shanghai 120000.0
Suzhou NaN
shenzhen NaN
Name: income, dtype: float64
import pandas as pd
# Rebuild the income Series, then read one value by its index label.
cities = {
    'Beijing': 55000,
    'Shanghai': 60000,
    'shenzhen': 50000,
    'Hangzhou': 20000,
    'Guangzhou': 45000,
    'Suzhou': None,
}
apts = pd.Series(cities, name='income')
print(apts.loc['Shanghai'])
60000.0
# Membership on a Series tests the index labels, not the values.
print('Hangzhou' in apts.index)
True
# A label that is not in the index gives False rather than raising.
print('Choingqing' in apts.index)
False
import pandas as pd
# Boolean filtering: build a mask, then index the Series with it.
cities = {
    'Beijing': 55000, 'Shanghai': 60000, 'shenzhen': 50000,
    'Hangzhou': 20000, 'Guangzhou': 45000, 'Suzhou': None,
}
apts = pd.Series(cities, name='income')
# NOTE: despite its name, this mask is inclusive (<=), so the entry that is
# exactly 50000 is selected. The NaN entry compares False and is dropped.
less_than_50000 = apts <= 50000
print(apts[less_than_50000])
Guangzhou 45000.0
Hangzhou 20000.0
shenzhen 50000.0
Name: income, dtype: float64
# Note: NumPy's aggregation functions (mean, median, max, min) can be used on a Series.
# mean() averages only the present values; the NaN entry is skipped.
print(apts.mean())
46000.0
import pandas as pd
# Rebuild the income Series and show the value that is about to be changed.
cities = {
    'Beijing': 55000,
    'Shanghai': 60000,
    'shenzhen': 50000,
    'Hangzhou': 20000,
    'Guangzhou': 45000,
    'Suzhou': None,
}
apts = pd.Series(data=cities, name='income')
print(apts)
print('Old income of shenzhen:{}'.format(apts.loc['shenzhen']))
Beijing 55000.0
Guangzhou 45000.0
Hangzhou 20000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 50000.0
Name: income, dtype: float64
Old income of shenzhen:50000.0
# Overwrite a single entry in place by its label, then show the result.
apts.loc['shenzhen'] = 70000
print(apts)
print('New income of shenzhen:{}'.format(apts.loc['shenzhen']))
Beijing 55000.0
Guangzhou 45000.0
Hangzhou 20000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 70000.0
Name: income, dtype: float64
New income of shenzhen:70000.0
import pandas as pd
# Assignment through a boolean mask: every entry strictly below 50000 is
# replaced by 40000 in a single statement.
cities = {
    'Beijing': 55000, 'Shanghai': 60000, 'shenzhen': 50000,
    'Hangzhou': 20000, 'Guangzhou': 45000, 'Suzhou': None,
}
apts = pd.Series(cities, name='income')
apts.loc['shenzhen'] = 70000
print('New income of shenzhen:{}'.format(apts.loc['shenzhen']))
# The mask is computed before the overwrite, so it still records which entries
# were originally below the threshold. NaN compares False and is left alone.
less_than_50000 = apts < 50000
print(less_than_50000)
apts.loc[less_than_50000] = 40000
print(apts)
Beijing False
Guangzhou True
Hangzhou True
Shanghai False
Suzhou False
shenzhen False
Name: income, dtype: bool
Beijing 55000.0
Guangzhou 40000.0
Hangzhou 40000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 70000.0
Name: income, dtype: float64
import pandas as pd
import numpy as np
# Set up the income Series in the same state the previous example ended in.
cities = {
    'Beijing': 55000,
    'Shanghai': 60000,
    'shenzhen': 50000,
    'Hangzhou': 20000,
    'Guangzhou': 45000,
    'Suzhou': None,
}
apts = pd.Series(cities, name='income')
apts.loc['shenzhen'] = 70000
print('New income of shenzhen:{}'.format(apts.loc['shenzhen']))
less_than_50000 = apts < 50000
apts.loc[less_than_50000] = 40000
print(apts)

# Scalar arithmetic and NumPy ufuncs are applied element by element.
print(apts / 2)
print(apts ** 1.5)
print(np.log(apts))

# A second Series with a partly different set of labels. Adding the two aligns
# on labels, so a label missing from either side produces NaN.
apts2 = pd.Series({
    'Beijing': 10000,
    'Shanghai': 8000,
    'shenzhen': 6000,
    'Tianjin': 40000,
    'Guangzhou': 7000,
    'Chongqing': 30000,
})
print(apts2)
print(apts + apts2)
# Start the missing-data examples from a fresh copy of the income Series with
# the same two edits applied: shenzhen raised to 70000, then every value below
# 50000 set to 40000.
cities = {
    'Beijing': 55000, 'Shanghai': 60000, 'shenzhen': 50000,
    'Hangzhou': 20000, 'Guangzhou': 45000, 'Suzhou': None,
}
apts = pd.Series(data=cities, name='income')
apts.loc['shenzhen'] = 70000
less_than_50000 = apts < 50000
apts.loc[less_than_50000] = 40000
print(apts)
Beijing 55000.0
Guangzhou 40000.0
Hangzhou 40000.0
Shanghai 60000.0
Suzhou NaN
shenzhen 70000.0
Name: income, dtype: float64
# Second Series. It has no missing values, so it keeps an integer dtype, and
# its labels only partly overlap with those of apts.
apts2 = pd.Series({
    'Beijing': 10000,
    'Shanghai': 8000,
    'shenzhen': 6000,
    'Tianjin': 40000,
    'Guangzhou': 7000,
    'Chongqing': 30000,
})
print(apts2)
Beijing 10000
Chongqing 30000
Guangzhou 7000
Shanghai 8000
Tianjin 40000
shenzhen 6000
dtype: int64
# The same label can be present in one Series and absent from the other.
print('Hangzhou' in apts.index)
print('Hangzhou' in apts2.index)
True
False
print(apts.notnull()) # boolean mask: True where a value is present, False where it is NaN
Beijing True
Guangzhou True
Hangzhou True
Shanghai True
Suzhou False
shenzhen True
Name: income, dtype: bool
print(apts.isnull()) # inverse mask: True only where the value is missing (NaN)
Beijing False
Guangzhou False
Hangzhou False
Shanghai False
Suzhou True
shenzhen False
Name: income, dtype: bool
print(apts[apts.isnull()]) # use the isnull() mask to select only the missing entries
Suzhou NaN
Name: income, dtype: float64
# Add the two Series. The result covers the union of both indexes, and any
# label missing from either operand (or already NaN) comes out as NaN.
apts=apts+apts2
print(apts)
Beijing 65000.0
Chongqing NaN
Guangzhou 47000.0
Hangzhou NaN
Shanghai 68000.0
Suzhou NaN
Tianjin NaN
shenzhen 76000.0
dtype: float64
# Fill every missing position with the mean (not the median) of the present
# values. mean() is evaluated first and skips NaN.
apts[apts.isnull()]=apts.mean()
print(apts)
Beijing 65000.0
Chongqing 64000.0
Guangzhou 47000.0
Hangzhou 64000.0
Shanghai 68000.0
Suzhou 64000.0
Tianjin 64000.0
shenzhen 76000.0
dtype: float64