使用pandas数据帧生成一个类（更新）

import numpy as np
import pandas as pd


class logdata():
    """Rolling log of the most recent labelled observations.

    Rows are kept newest-first in ``self.df`` (row 0 is the latest insert) and
    the frame never holds more than ``size`` rows. Each row records how often
    its label occurred in the window, and the matching percentage, at the
    moment the row was inserted; older rows are not re-scored afterwards.
    """

    _COLUMNS = ['Timestamp', 'Label', 'Occurance', 'Confidence']

    def __init__(self, size):
        """Create an empty log that retains at most ``size`` rows."""
        self.size = size
        self.x = None            # label of the most recent insert
        self.timestamp = None    # timestamp of the most recent insert
        self.confidence = 100    # confidence of the most recent insert
        self.occurance = 1       # occurrence count of the most recent insert
        # Build the frame up front so insertdf() works without a prior
        # createdf() call; createdf() can still be called to reset the log.
        self.createdf()

    def createdf(self):
        """Reset ``self.df`` to an empty frame with the log columns and return it."""
        self.df = pd.DataFrame(data=None, columns=self._COLUMNS)
        return self.df

    def insertdf(self, x, timestamp):
        """Insert a new observation at the top of the log and return the frame.

        Args:
            x: Label of the observation.
            timestamp: Timestamp stored alongside the label.

        Returns:
            The updated DataFrame, newest row first, trimmed to ``size`` rows.
        """
        # Remember the current label: get_occurance() reads self.x.
        self.x = x
        self.timestamp = timestamp

        # Confidence is stored as float so a fractional percentage can be
        # written into the column without a dtype change.
        new_row = pd.DataFrame(
            [{'Timestamp': timestamp, 'Label': x,
              'Occurance': 1, 'Confidence': 100.0}],
            columns=self._COLUMNS,
        )
        # Skip the empty frame when concatenating: mixing in an empty,
        # object-typed frame would degrade the column dtypes.
        frames = [new_row] if self.df.empty else [new_row, self.df]
        self.df = pd.concat(frames, ignore_index=True)
        self.del_row()

        # Score the new row against the trimmed window, so the row itself is
        # counted (the first insert yields occurance 1 / confidence 100).
        if not self.df.empty:
            self.occurance = self.get_occurance()
            self.confidence = self.get_confidence()
            self.df.at[0, 'Occurance'] = self.occurance
            self.df.at[0, 'Confidence'] = self.confidence
        return self.df

    def get_occurance(self):
        """Return how many rows in the log carry the current label ``self.x``."""
        return int((self.df['Label'] == self.x).sum())

    def get_confidence(self):
        """Return ``self.occurance`` as a percentage of the rows in the log.

        Returns 100 when the log is empty.
        """
        rows = self.df.shape[0]
        if rows:
            return (self.occurance / rows) * 100
        return 100

    def del_row(self):
        """Trim the log to the newest ``size`` rows and return the frame."""
        limit = max(int(self.size), 0)
        if self.df.shape[0] > limit:
            # Rows are newest-first, so the rows to keep are the leading ones.
            # copy() detaches the result from the slice it was taken from.
            self.df = self.df.iloc[:limit].copy()
        return self.df

    def get_result(self):
        """Return the row with the highest confidence (the newest one on ties).

        Raises:
            ValueError: If the log is empty.
        """
        return self.df.loc[self.df['Confidence'].idxmax()]

1条回答

网友

1楼 · 发布于 2024-05-01 22:01:25

请参见下面修订后的代码，它会给出你想要的输出。如果需要我对其中任何部分做进一步说明，请告诉我——不过代码本身应该是不言自明的。

import pandas as pd

class logdata:
    """Rolling log of the most recent labelled observations.

    ``self.df`` holds at most ``size`` rows, newest first (row 0 is the latest
    insert). After every insert, all rows are re-scored: ``Occurance`` is the
    number of rows in the window sharing the row's label, and ``Confidence`` is
    that count as a whole-number percentage of the window.
    """

    def __init__(self, size):
        """Create an empty log that retains at most ``size`` rows."""
        self.size = size
        self.df = pd.DataFrame(
            data=None,
            columns=['Timestamp', 'Label', 'Occurance', 'Confidence'],
        )

    def insertdf(self, x, timestamp):
        """Insert a new observation at the top of the log and return the frame.

        Args:
            x: Label of the observation.
            timestamp: Timestamp stored alongside the label.

        Returns:
            The updated DataFrame, newest row first, trimmed to ``size`` rows.
        """
        # Default values; they are already correct when the row is alone.
        new_row = pd.DataFrame(
            [{
                'Timestamp': timestamp,
                'Label': x,
                'Occurance': 1,
                'Confidence': 100,
            }],
            columns=self.df.columns,
        )

        # DataFrame.append was removed in pandas 2.0, so use concat. Putting
        # the new row first keeps the frame newest-first without re-sorting:
        # sorting a freshly renumbered index in descending order would flip
        # the older rows on each insert and could evict the wrong row.
        # The empty frame is skipped so it cannot degrade the column dtypes.
        frames = [new_row] if self.df.empty else [new_row, self.df]
        self.df = pd.concat(frames, ignore_index=True)
        self.del_row()

        # Calculate the confidence and occurrences of labels.
        if self.df.shape[0] > 1:
            occurance = self.get_occurance()
            confidence = self.get_confidence(occurance)

            # Both Series are indexed by label, so map() performs the lookup.
            self.df['Occurance'] = self.df['Label'].map(occurance)
            self.df['Confidence'] = self.df['Label'].map(confidence)

        return self.df

    def get_occurance(self):
        """Return a Series, indexed by label, of row counts per label."""
        # size() counts rows, so a row with a null timestamp is still counted.
        occ = self.df.groupby('Label').size().rename('Occurance').astype(int)
        return occ

    def get_confidence(self, occurance):
        """Return each label's share of all occurrences as an integer percent.

        Args:
            occurance: Series of integer counts indexed by label, as returned
                by ``get_occurance``.

        Returns:
            Series named ``Confidence`` with the percentage rounded down.
        """
        total = occurance.sum()
        # Integer floor division avoids float artefacts such as
        # 29 / 100 * 100 == 28.999..., which would truncate to 28.
        conf = (occurance * 100 // total).rename('Confidence').astype(int)
        return conf

    def del_row(self):
        """Trim the log in place to the newest ``size`` rows."""
        limit = max(int(self.size), 0)
        if self.df.shape[0] > limit:
            # copy() detaches the result from the slice it was taken from, so
            # the column assignments in insertdf() act on a standalone frame.
            self.df = self.df.head(limit).copy()

    def get_result(self):
        """Return the row with the highest confidence (the newest one on ties).

        Raises:
            ValueError: If the log is empty.
        """
        return self.df.loc[self.df['Confidence'].idxmax()]

相关问题更多 >

编程相关推荐

热门问题

热门文章