1 | frame.mad() |
1 | one 0.666667 |
1 | frame.var() |
1 | one 1.0 |
1 | frame.std() |
1 | one 1.000000 |
1 | frame.skew() |
1 | one 0.0 |
1 | pd.DataFrame([1,2,3,4,3,2,1,0]).kurt() |
1 | 0 -0.7 |
1 | frame, frame.quantile(0.5), frame.mean() |
1 | ( one two |
1 | frame.quantile(0.75) - frame.quantile(0.25) ### 离差IQR |
1 | one 1.0 |
1 | frame |
one | two | |
---|---|---|
a | 1.0 | NaN |
b | 2.0 | 4.0 |
c | NaN | NaN |
d | 3.0 | 5.0 |
1 | frame.cumsum() |
one | two | |
---|---|---|
a | 1.0 | NaN |
b | 3.0 | 4.0 |
c | NaN | NaN |
d | 6.0 | 9.0 |
1 | frame.cumprod() |
one | two | |
---|---|---|
a | 1.0 | NaN |
b | 2.0 | 4.0 |
c | NaN | NaN |
d | 6.0 | 20.0 |
1 | frame.cummax() |
one | two | |
---|---|---|
a | 1.0 | NaN |
b | 2.0 | 4.0 |
c | NaN | NaN |
d | 3.0 | 5.0 |
1 | frame |
one | two | |
---|---|---|
a | 1.0 | NaN |
b | 2.0 | 4.0 |
c | NaN | NaN |
d | 3.0 | 5.0 |
1 | frame.idxmax() |
1 | one d |
1 | frame.idxmax(axis=1) |
1 | a one |
1 | frame |
one | two | |
---|---|---|
a | 1.0 | NaN |
b | 2.0 | 4.0 |
c | NaN | NaN |
d | 3.0 | 5.0 |
1 | frame.describe() |
one | two | |
---|---|---|
count | 3.0 | 2.000000 |
mean | 2.0 | 4.500000 |
std | 1.0 | 0.707107 |
min | 1.0 | 4.000000 |
25% | 1.5 | 4.250000 |
50% | 2.0 | 4.500000 |
75% | 2.5 | 4.750000 |
max | 3.0 | 5.000000 |
1 | obj = pd.Series(['a', 'a', 'b', 'c'] * 4) |
1 | (0 a |
1 | # 数据准备 |
AAPL | GOOG | IBM | MSFT | |
---|---|---|---|---|
Date | ||||
2010-01-04 | NaN | NaN | NaN | NaN |
2010-01-05 | 0.001729 | -0.004404 | -0.012080 | 0.000323 |
2010-01-06 | -0.015906 | -0.025209 | -0.006496 | -0.006137 |
2010-01-07 | -0.001849 | -0.023280 | -0.003462 | -0.010400 |
2010-01-08 | 0.006648 | 0.013331 | 0.010035 | 0.006897 |
... | ... | ... | ... | ... |
2016-10-17 | -0.000680 | 0.001837 | 0.002072 | -0.003483 |
2016-10-18 | -0.000681 | 0.019616 | -0.026168 | 0.007690 |
2016-10-19 | -0.002979 | 0.007846 | 0.003583 | -0.002255 |
2016-10-20 | -0.000512 | -0.005652 | 0.001719 | -0.004867 |
2016-10-21 | -0.003930 | 0.003011 | -0.012474 | 0.042096 |
1714 rows × 4 columns
1 | returns['MSFT'].cov(returns['IBM']) |
8.870655479703546e-05
1 | returns.cov() |
AAPL | GOOG | IBM | MSFT | |
---|---|---|---|---|
AAPL | 0.000277 | 0.000107 | 0.000078 | 0.000095 |
GOOG | 0.000107 | 0.000251 | 0.000078 | 0.000108 |
IBM | 0.000078 | 0.000078 | 0.000146 | 0.000089 |
MSFT | 0.000095 | 0.000108 | 0.000089 | 0.000215 |
1 | returns['MSFT'].corr(returns['IBM']) |
1 | 0.4997636114415114 |
1 | returns.corr() |
AAPL | GOOG | IBM | MSFT | |
---|---|---|---|---|
AAPL | 1.000000 | 0.407919 | 0.386817 | 0.389695 |
GOOG | 0.407919 | 1.000000 | 0.405099 | 0.465919 |
IBM | 0.386817 | 0.405099 | 1.000000 | 0.499764 |
MSFT | 0.389695 | 0.465919 | 0.499764 | 1.000000 |
1 | returns.corrwith(returns.IBM) |
1 | AAPL 0.386817 |
1 | returns.corrwith(volume) # 一一对应 |
1 | AAPL -0.075565 |
1 | returns.T.corrwith(volume.T, axis=1) |
1 | AAPL -0.075565 |
1 | obj = pd.Series(['c', 'a', 'd', 'a', 'a', 'b', 'b', 'c', 'c']) |
array(['c', 'a', 'd', 'b'], dtype=object)
1 | frame = pd.DataFrame([[1, np.nan], [2, 4], |
1 | ( one two |
1 | obj = pd.Series(['c', 'a', 'd', 'a', 'a', 'b', 'b', 'c', 'c']) |
1 | c 3 |
1 | frame = pd.DataFrame([[1, 3, 5], [2, 4, 6], |
1 | ( one two thr |