如何根据df.idxmax返回的Series制作基于日期的颜色条？

fig, ax = plt.subplots(1,1, figsize=(20,20)) smap=plt.scatter(df.col1, df.col2, s=140, c=[date2num(i.date()) for i in df.index], marker='.') cb = fig.colorbar(smap, orientation='vertical', format=DateFormatter('%d %b %y'))

for n in cols1: for m in cols2: fig, ax = plt.subplots(1,1, figsize=(15,15)) maxTimes=df2[n].idxmax() PlottableTimes=maxTimes.dropna() #some NaNs in the #.idxmax series were giving date2num trouble smap2=plt.scatter(df2[n].max(), df2[m].max(), s=160, c=[date2num(i.date()) for i in PlottableTimes], marker='.') cb2 = fig.colorbar(smap2, orientation='vertical', format=DateFormatter('%d %b %y')) plt.show()

df=pd.DataFrame(np.random.randint(low=0, high=10, size=(169, 8)), columns=['a', 'b', 'c', 'd', 'e','f','g','h']) #make sample data date_rng = pd.date_range(start='1/1/2018', end='1/8/2018', freq='H') df['i']=date_rng df = df.set_index('i') #get a datetime index df['ts']=date_rng #get a datetime column to group by from pandas import Grouper df2=df.groupby(Grouper(key='ts', freq='D')) for n in ['a','b','c','d']: #now make some plots for m in ['e','f','g','h']: print(m) print(n) fig, ax = plt.subplots(1,1, figsize=(5,5)) maxTimes=df2[n].idxmax() PlottableTimes=maxTimes.dropna() smap=plt.scatter(df2[n].max(), df2[m].max(), s=160, c=[date2num(i.date()) for i in PlottableTimes], marker='.') cb = fig.colorbar(smap, orientation='vertical', format=DateFormatter('%d %b %y')) plt.show()

for n in ['a','b','c','d']: for m in ['e','f','g','h']: print(m) print(n) fig, ax = plt.subplots(1,1, figsize=(5,5)) maxTimes=df2[n].idxmax() PlottableTimes=maxTimes.dropna() smap=plt.scatter(df2[n].max(), df2[m].max(), s=160, c=[736809.0, 736810.0, 736811.0, 736812.0, 736813.0, 736814.0, 736815.0, 736816.0], marker='.') cb = fig.colorbar(smap, orientation='vertical', format=DateFormatter('%d %b %y')) plt.show()

for n in ['a','b','c','d']: for m in ['e','f','g','h']: print(m) print(n) fig, ax = plt.subplots(1,1, figsize=(5,5)) maxTimes=df2[n].idxmax() PlottableTimes=maxTimes.dropna() smap=plt.scatter(df2[n].max(), df2[m].max(), s=160, c=[736809.0, 736810.0, 736811.0, 736812.0, 736813.0, 736814.0], marker='.') cb = fig.colorbar(smap, orientation='vertical', format=DateFormatter('%d %b %y')) plt.show()

1条回答

网友

1楼 · 发布于 2024-06-11 11:33:02

本质上，您的Grouper调用相当于把日期时间列设为索引，然后调用resample并指定聚合函数：

df.set_index('ts').resample('D').max()
#             a  b  c  d  e  f  g  h
# ts                                
# 2018-01-01  9  9  8  9  9  9  9  9
# 2018-01-02  9  9  9  9  9  9  9  9
# 2018-01-03  9  9  9  9  9  9  9  9
# 2018-01-04  9  9  9  9  9  9  9  9
# 2018-01-05  9  9  9  9  9  9  9  9
# 2018-01-06  9  9  9  8  9  9  9  9
# 2018-01-07  9  9  9  9  9  9  9  9
# 2018-01-08  2  8  6  3  1  3  2  7

因此，df2['a'].max()返回的是一个以日期为索引的Pandas Series（与上面重采样的聚合结果一致），它带有index属性，可直接用于指定颜色条的取值：

df2['a'].max().index

# DatetimeIndex(['2018-01-01', '2018-01-02', '2018-01-03', '2018-01-04',
#                '2018-01-05', '2018-01-06', '2018-01-07', '2018-01-08'],
#               dtype='datetime64[ns]', name='ts', freq='D')

接下来可以把该索引直接传给date2num，而无需使用列表推导式：

date2num(df2['a'].max().index)

# array([736695., 736696., 736697., 736698., 736699., 736700., 736701., 736702.])

总之，只需在循环中使用上述内容，而无需maxTimes或PlottableTimes：

fig, ax = plt.subplots(1, 1, figsize = (5,5))

smap = plt.scatter(df2[n].max(), df2[m].max(), s = 160, 
                   c = date2num(df2[n].max().index), 
                   marker = '.')
cb = fig.colorbar(smap, orientation = 'vertical',
                  format = DateFormatter('%d %b %y'))

相关问题更多 >

编程相关推荐

热门问题

热门文章