如何识别Pandas数据集中的特定序列（往返）？

# Sample trades for one trader across two stocks; `tag` is the desired
# roundtrip label for each row (0 = roundtrip not completed).
pd.DataFrame(
    {
        'trader': ['a', 'a', 'a', 'a', 'a', 'a', 'a'],
        'stock': ['a', 'a', 'a', 'a', 'a', 'a', 'b'],
        'day': [0, 1, 2, 4, 5, 10, 1],
        'delta': [10, -10, 15, -10, -5, 5, 6],
        'cumq': [10, 0, 15, 5, 0, 5, 6],
        'tag': [1, 1, 2, 2, 2, 0, 0],
    }
)

Out[15]:
   cumq  day  delta stock  tag trader
0    10    0     10     a    1      a
1     0    1    -10     a    1      a
2    15    2     15     a    2      a
3     5    4    -10     a    2      a
4     0    5     -5     a    2      a
5     5   10      5     a    0      a
6     6    1      6     b    0      a

import pandas as pd
import numpy as np

# Sample trades; `out` holds the expected roundtrip tag for every row.
df = pd.DataFrame({
    'trader': ['a', 'a', 'a', 'a', 'a', 'a', 'a'],
    'stock': ['a', 'a', 'a', 'a', 'a', 'a', 'b'],
    'day': [0, 1, 2, 4, 5, 10, 1],
    'delta': [10, -10, 15, -10, -5, 5, 0],
    'out': [1, 1, 2, 2, 2, 0, 1],
})


def proc_trader(_df):
    """Tag every row of one (trader, stock) trade history with its roundtrip.

    A roundtrip ends on each row whose cumulative position ``cumq`` is 0.
    Roundtrips are numbered 1, 2, ... in row order; every row receives the
    number of the roundtrip it belongs to, and rows after the last completed
    roundtrip receive 0.

    Args:
        _df: Rows of a single group, already in the order they should be
            processed; must contain a ``cumq`` column.

    Returns:
        The same frame with an integer ``tag`` column added (or overwritten).
    """
    # Use the group's own cumq (not the global frame) to find roundtrip ends.
    is_end = _df['cumq'].eq(0)
    # Number each end row 1..k, leave the other rows empty for now.
    end_number = is_end.cumsum().where(is_end, np.nan)
    # Backfill each number over the rows leading up to that end; whatever is
    # still empty lies after the last completed roundtrip and becomes 0.
    _df['tag'] = end_number.bfill().fillna(0).astype(int)
    return _df


# Rows must be in day order inside each group before accumulating.
df = df.sort_values(by=['trader', 'stock', 'day'])
df['cumq'] = df.groupby(['trader', 'stock'])['delta'].cumsum()
# group_keys=False keeps the original row index so the tags align back onto
# df; taking only `tag` leaves the other columns of df untouched.
df['tag'] = (
    df.groupby(['trader', 'stock'], group_keys=False)
    .apply(proc_trader)['tag']
)

1条回答

网友

1楼 · 发布于 2024-05-18 23:31:41

我会这样做：

import pandas as pd
import numpy as np

# Sample trades. `cumq` is the running sum of `delta` within each
# (trader, stock) pair; `tag` holds the expected roundtrip labels.
df = pd.DataFrame({
    'trader': ['a', 'a', 'a', 'a', 'a', 'a', 'a'],
    'stock': ['a', 'a', 'a', 'a', 'a', 'a', 'b'],
    'day': [0, 1, 2, 4, 5, 10, 1],
    'delta': [10, -10, 15, -10, -5, 5, 6],
    'cumq': [10, 0, 15, 5, 0, 5, 6],
    'tag': [1, 1, 2, 2, 2, 0, 0],
})

def proc_trader(_df):
    """Tag every row of one (trader, stock) trade history with its roundtrip.

    A roundtrip ends on each row whose cumulative position ``cumq`` is 0.
    Roundtrips are numbered 1, 2, ... in row order; every row receives the
    number of the roundtrip it belongs to, and rows after the last completed
    roundtrip receive 0. Single-row and empty groups need no special case.

    Args:
        _df: Rows of a single group, already in the order they should be
            processed; must contain a ``cumq`` column.

    Returns:
        The same frame with an integer ``tag`` column added (or overwritten).
    """
    # Look only at this group's cumq: masking with the module-level frame
    # would count roundtrip ends that belong to other groups.
    is_end = _df['cumq'].eq(0)
    # Number each end row 1..k, leave the other rows empty for now.
    end_number = is_end.cumsum().where(is_end, np.nan)
    # Backfill each number over the rows leading up to that end; whatever is
    # still empty lies after the last completed roundtrip and becomes 0.
    _df['tag'] = end_number.bfill().fillna(0).astype(int)
    return _df

# Tag each (trader, stock) history independently. group_keys=False keeps the
# original row index so the tags align back onto df; assigning only `tag`
# leaves every other column of df (including the grouping keys) in place.
df['tag'] = (
    df.groupby(['trader', 'stock'], group_keys=False)
    .apply(proc_trader)['tag']
)

思路是：每个交易者在每只股票上的记录都由一系列往返交易组成，只有末尾可能留有一段尚未完成的往返；这里对零增量（delta 为 0）的记录应如何计数做了一个假设。我们先找出所有往返结束的位置（cumq 回到 0 的行）并依次编号，再把编号向前回填（bfill）到该往返内的其余各行，最后把剩下的行（最近尚未完成的往返）填为 0。

相关问题更多 >

编程相关推荐

热门问题

热门文章