import pandas as pd


pd.Series([1, 3, 2])

0    1
1    3
2    2
dtype: int64


# Float Series with labels 'a'..'c' and the name 'PS'.
ps = pd.Series(
    data=[1, 3, 2],
    index=['a', 'b', 'c'],
    dtype=float,
    name='PS',
)
ps

a    1.0
b    3.0
c    2.0
Name: PS, dtype: float64


ps.values

array([1., 3., 2.])


ps.index

Index(['a', 'b', 'c'], dtype='object')


ps['b'], ps.loc['b']

(3.000, 3.000)


# Positional access must be explicit: plain ps[0] on a label-indexed Series
# relies on a deprecated integer-position fallback, so use .iloc / .iat instead.
ps.iloc[0], ps.iat[0]

(1.000, 1.000)


ps['a':'b']

a    1.0
b    3.0
Name: PS, dtype: float64

ps

a    1.0
b    3.0
c    2.0
Name: PS, dtype: float64


ps > 1

a    False
b     True
c     True
Name: PS, dtype: bool


ps[ps > 1]

b    3.0
c    2.0
Name: PS, dtype: float64


ps[(ps > 1) & (ps < 3)]

c    2.0
Name: PS, dtype: float64


# String Series; the boolean mask keeps only entries ending in 'e'.
ps3 = pd.Series(data=['one', 'two', 'three'])
ps3.loc[ps3.str.endswith('e')]

0      one
2    three
dtype: object


ps.sort_index()

a    1.0
b    3.0
c    2.0
Name: PS, dtype: float64


ps.sort_values()
# NOTE: Indices 'follow' values through sorting

a    1.0
c    2.0
b    3.0
Name: PS, dtype: float64


ps
# NOTE: sort_xxx() returns a copy (inplace=False by default)

a    1.0
b    3.0
c    2.0
Name: PS, dtype: float64


ps.sort_index(ascending=False, inplace=True)
ps

c    2.0
b    3.0
a    1.0
Name: PS, dtype: float64


ps.sum()

6.000


ps.max()

3.000


ps.mean()

2.000


ps.std()

1.000


ps * 2

c    4.0
b    6.0
a    2.0
Name: PS, dtype: float64


# Integer Series labelled 'a' and 'c' (no 'b'), used for the index-aligned addition below.
ps1 = pd.Series(data=[4, 5], index=['a', 'c'])
ps1

a    4
c    5
dtype: int64


ps2 = ps + ps1
ps2
# NOTE: Elements are matched by Index!

a    5.0
b    NaN
c    7.0
dtype: float64


ps2.isnull()

a    False
b     True
c    False
dtype: bool


ps2.notnull()

a     True
b    False
c     True
dtype: bool


ps2.dropna()
# NOTE: returns a copy (inplace=False by default)

a    5.0
c    7.0
dtype: float64


ps2.fillna(0, inplace=True)
ps2

a    5.0
b    0.0
c    7.0
dtype: float64

ps2

a    5.0
b    0.0
c    7.0
dtype: float64


ps2.replace(0, -1)

a    5.0
b   -1.0
c    7.0
dtype: float64


ps2.replace([5, 7], -2)

a   -2.0
b    0.0
c   -2.0
dtype: float64


ps2.replace({0: -1, 7: -2})
# NOTE: Skips over missing keys

a    5.0
b   -1.0
c   -2.0
dtype: float64


ps2.map({0: -1, 7: -2})
# NOTE: Missing keys result in nulls

a    NaN
b   -1.0
c   -2.0
dtype: float64


ps2.apply(lambda x: x**2)

a    25.0
b     0.0
c    49.0
dtype: float64


# Five dates spaced two days apart, plus the day of month and weekday number
# derived through the .dt accessor.
df_dates = pd.DataFrame(
    {'Date': pd.date_range('1/1/2020', periods=5, freq='2D')}
).assign(
    Day=lambda frame: frame['Date'].dt.day,
    DayOfWk=lambda frame: frame['Date'].dt.weekday,
)
df_dates

# Sample frame used by the rolling/cumsum/plot examples that follow:
# rows X, Y, Z and columns ColA, ColB, ColC holding 1..9 row by row.
df = pd.DataFrame(
    {'ColA': [1, 4, 7], 'ColB': [2, 5, 8], 'ColC': [3, 6, 9]},
    index=['X', 'Y', 'Z'],
)
df


df['ColA'].rolling(window=2).mean()

X    NaN
Y    2.5
Z    5.5
Name: ColA, dtype: float64


df['ColA'].cumsum()

X     1
Y     5
Z    12
Name: ColA, dtype: int64


df['ColA'].plot(kind='bar');

	Date	Day	DayOfWk
0	2020-01-01	1	2
1	2020-01-03	3	4
2	2020-01-05	5	6
3	2020-01-07	7	1
4	2020-01-09	9	3

Pandas Series Cheat Sheet¶

Create¶

Accessing Elements¶

Comparison and Filtering¶

Sorting¶

Computation¶

Vector Arithmetic¶

Series on Series Operations¶

Finding/Dropping/Filling Nulls (NaN)¶

Substitution¶

Misc¶

	ColA	ColB	ColC
X	1	2	3
Y	4	5	6
Z	7	8	9