快速/Pythonic方法来计算重复列表值之间的间隔

# make a 'histogram'/count of all the intervals between repeated values
def hist_intervals(a):
    """Count the index gaps between consecutive occurrences of each value.

    Args:
        a: Indexable sequence of hashable, mutually orderable values.

    Returns:
        A dict mapping every distinct value in ``a`` to a dict of
        ``{interval: count}``. Values that occur only once map to an
        empty dict.
    """
    values = sorted(set(a))  # get list of which values are in a

    # setup the dict to hold the histogram
    hist, last_index = {}, {}
    for i in values:
        hist[i] = {}
        last_index[i] = -1  # some default value

    # now go through the array and find intervals
    for i in range(len(a)):
        val = a[i]
        if last_index[val] != -1:  # do nothing if it's the first time
            interval = i - last_index[val]
            if interval in hist[val]:
                hist[val][interval] += 1
            else:
                hist[val][interval] = 1
        last_index[val] = i
    return hist


# example list/array
a = [1,2,3,1,5,3,2,4,2,1,5,3,3,4]

histdict = hist_intervals(a)
print("histdict = ",histdict)

# correct answer for this example
answer = {
    1: {3:1, 6:1},
    2: {2:1, 5:1},
    3: {1:1, 3:1, 6:1},
    4: {6:1},
    5: {6:1},
}
print("answer = ",answer)

2条回答

网友

1楼 · 编辑于 2024-04-24 14:01:14

在数据结构方面有一个明显可以改进的地方：与其让 hist 使用“字典的字典”，不如使用以 Counter 为默认值的 defaultdict，即 defaultdict(Counter)。这让代码变得更简洁：

from collections import defaultdict, Counter

# make a 'histogram'/count of all the intervals between repeated values
def hist_intervals(a):
    """Count the gaps between consecutive occurrences of each repeated value.

    Args:
        a: Iterable of hashable values, scanned once in order.

    Returns:
        A ``defaultdict`` mapping each value that occurs more than once to a
        ``Counter`` of ``{interval: occurrences}``, where an interval is the
        index distance between two consecutive occurrences of that value.
        Values that never repeat get no entry.
    """
    # Entries are created lazily on the first repeat, so no setup pass over
    # the distinct values is needed.
    hist, last_index = defaultdict(Counter), {}

    # now go through the array and find intervals
    for i, val in enumerate(a):
        if val in last_index:  # do nothing if it's the first time
            interval = i - last_index[val]
            # Counter.update counts each element of the iterable it is given,
            # so a one-element tuple adds one to this interval's tally.
            hist[val].update((interval,))
        last_index[val] = i
    return hist

这会更快，因为原先在 Python 中显式编写的 if 判断（检查键是否已存在）改由 C 实现的代码来完成，而且代码也会更简洁。

网友

2楼 · 编辑于 2024-04-24 14:01:14

您可以通过精心构造的 defaultdict 来消除初始化循环。这样只需对输入列表扫描一次即可。在这里，我在打印时把结果中的 defaultdict 转换回常规的 Dict[int, Dict[int, int]]，但这只是为了让输出更美观。

from collections import defaultdict

def count_intervals(iterable):
    """Tally index distances between consecutive occurrences of each item.

    A single pass over ``iterable`` is made. The result is a nested
    ``defaultdict``: ``result[item][gap]`` is how many times ``item``
    reappeared exactly ``gap`` positions after its previous occurrence.
    Only items that occur at least twice get an entry.
    """
    previous_position = {}
    gap_counts = defaultdict(lambda: defaultdict(int))

    for position, item in enumerate(iterable):
        earlier = previous_position.get(item)
        # Positions are ints, so None can only mean "not seen before".
        if earlier is not None:
            gap = position - earlier
            gap_counts[item][gap] += 1
        previous_position[item] = position

    return gap_counts

a = [1, 2, 3, 1, 5, 3, 2, 4, 2, 1, 5, 3, 3, 4]

# Build the interval histogram, then print each value's counts as a plain
# dict so the nested defaultdict prints cleanly.
hist = count_intervals(a)
for k in hist:
    v = hist[k]
    print(k, dict(v))

# 1 {3: 1, 6: 1}
# 3 {3: 1, 6: 1, 1: 1}
# 2 {5: 1, 2: 1}
# 5 {6: 1}
# 4 {6: 1}

相关问题更多 >

编程相关推荐

热门问题

热门文章