计算一组关系的整数映射的更有效算法

# Version A: assign each symbol the smallest integer such that, within every
# relation, each symbol is strictly greater than the one before it.
# Works by repeated relaxation until a full pass changes nothing.
relations = [('a', 'c'), ('b', 'c'), ('b', 'd', 'e')]
print(relations)

# Every symbol starts at 0.  A set comprehension collects the symbols without
# the quadratic tuple concatenation that sum(relations, ()) performs.
values = dict.fromkeys({sym for rel in relations for sym in rel}, 0)
print(values)

converged = False
while not converged:
    converged = True
    for relation in relations:
        # Walk consecutive (predecessor, successor) pairs of the chain.
        for prev, cur in zip(relation, relation[1:]):
            if values[cur] <= values[prev]:
                converged = False
                values[cur] = values[prev] + 1
                # With N symbols and no cycle the largest possible value is
                # N - 1; reaching N means the relations are cyclic and the
                # loop would otherwise never terminate.
                if values[cur] >= len(values):
                    raise ValueError("relations contain a cycle")
print(values)

# Version B: repeatedly peel off every symbol that has no incoming relation,
# giving all symbols removed in the same round the same integer.
# Each relation here is a (smaller, larger) pair.
relations = [('a', 'c'), ('b', 'c'), ('b', 'd'), ('b', 'e'), ('d', 'e')]
symbols = {sym for rel in relations for sym in rel}
numIncoming = dict.fromkeys(symbols, 0)
values = {}
for rel in relations:
    numIncoming[rel[1]] += 1

k = 0             # number of symbols that have been assigned a value so far
n = len(symbols)
c = 0             # value handed out in the current round
while k < n:
    # Symbols with no remaining predecessor, and the relations leaving them.
    curs = [sym for sym in symbols if numIncoming[sym] == 0]
    if not curs:
        # Every remaining symbol still has a predecessor, so k can never
        # reach n: the remaining relations form a cycle.
        raise ValueError("relations contain a cycle among %s" % (symbols,))
    curr = [rel for rel in relations if rel[0] in curs]
    for sym in curs:
        symbols.remove(sym)
        values[sym] = c
    for rel in curr:
        relations.remove(rel)
        numIncoming[rel[1]] -= 1
    c += 1
    k += len(curs)
print(values)

// Assigns every element of [0, n) the index of its "chunk" in a layered
// topological order.
//
// Each entry of `relations` is a chain r[0] < r[1] < r[2] < ...; an element's
// chunk is the round in which it runs out of unplaced predecessors.  Elements
// that appear in no relation, or only in single-element relations, have no
// predecessors and land in chunk 0.  Empty relations are ignored.
//
// Preconditions (checked with assert): every element is < n and the
// relations are acyclic.  With asserts disabled, elements on or behind a
// cycle keep the value 0 that `ret` was initialised with.
vector<unsigned> chunked_topsort(const vector<vector<unsigned>>& relations, unsigned n) {
    vector<unsigned> ret(n);
    vector<set<unsigned>> succs(n);   // distinct direct successors per element
    vector<unsigned> npreds(n);       // number of distinct direct predecessors

    for(const auto& r : relations) {
        for(size_t i = 0; i < r.size(); ++i) {
            assert(r[i] < n);
            if(i == 0)
                continue;
            auto u = r[i-1];
            auto v = r[i];
            // set::insert reports whether the edge is new, so a repeated
            // edge is counted only once.
            if(succs[u].insert(v).second)
                npreds[v] += 1;
        }
    }

    // Seed the first chunk with everything that has no predecessor,
    // including elements never mentioned in any relation.
    set<unsigned> nopreds;
    for(unsigned i = 0; i < n; ++i)
        if(npreds[i] == 0)
            nopreds.insert(i);

    set<unsigned> next;
    unsigned chunk = 0;
    unsigned placed = 0;
    while(!nopreds.empty()) {
        next.clear();
        for(const auto& u : nopreds) {
            ret[u] = chunk;
            ++placed;
            for(const auto& v : succs[u]) {
                npreds[v] -= 1;
                if(npreds[v] == 0)
                    next.insert(v);
            }
        }
        swap(nopreds, next);
        ++chunk;
    }
    // Anything left unplaced still had a predecessor, i.e. sits on or
    // behind a cycle.
    assert(placed == n);
    (void)placed;
    return ret;
}

// Layered topological sort over the elements [0, n) using only flat vectors.
//
// Each entry of `relations` is a chain r[0] < r[1] < ...; relations with
// fewer than two elements contribute no edges.  Returns, for every element,
// the round in which its last predecessor was placed (0 for elements with no
// predecessors).  Out-of-range elements and cycles are caught by assert.
vector<unsigned> chunked_topsort2(const vector<vector<unsigned>>& relations, unsigned n) {
    vector<unsigned> ordinal(n);
    vector<unsigned> indegree(n);
    vector<tuple<unsigned, unsigned>> edges;
    edges.reserve(relations.size());
    // first_edge[u] .. first_edge[u+1] will delimit u's outgoing edges once
    // the per-source counts are prefix-summed and the edges are sorted.
    vector<unsigned> first_edge(n+1);

    for(const auto& chain : relations) {
        for(size_t k = 1; k < chain.size(); ++k) {
            const unsigned from = chain[k-1];
            const unsigned to = chain[k];
            assert(from < n && to < n);
            edges.emplace_back(from, to);
            ++first_edge[from+1];
            ++indegree[to];
        }
    }
    partial_sum(first_edge.begin(), first_edge.end(), first_edge.begin());
    sort(edges.begin(), edges.end());

    vector<unsigned> frontier;
    for(unsigned e = 0; e < n; ++e) {
        if(indegree[e] == 0)
            frontier.push_back(e);
    }

    vector<unsigned> upcoming;
    for(unsigned level = 0; !frontier.empty(); ++level) {
        upcoming.clear();
        for(const auto& src : frontier) {
            ordinal[src] = level;
            const unsigned stop = first_edge[src+1];
            for(unsigned k = first_edge[src]; k < stop; ++k) {
                const unsigned dst = std::get<1>(edges[k]);
                if(--indegree[dst] == 0)
                    upcoming.push_back(dst);
            }
        }
        swap(frontier, upcoming);
    }

    // A non-zero in-degree here means the element was never released,
    // i.e. it sits on or behind a cycle.
    assert(all_of(indegree.begin(), indegree.end(), [](unsigned d) { return d == 0; }));
    return ordinal;
}

1条回答

网友

1楼 · 发布于 2024-05-23 16:54:16

下面是一个我之前没有时间发布的实现：

def chunked_topsort(relations):
    """Group elements into topologically ordered chunks.

    `relations` is an iterable producing relations.  A relation is an
    iterable of hashable elements, interpreted to mean
    relation[0] < relation[1] < relation[2] < ...
    Empty relations are ignored; a one-element relation just registers
    that element.

    Returns a list of sets such that result[i] is the set of elements
    assigned to i: result[0] holds the elements with no predecessor, and
    each later set holds the elements whose last predecessor was placed
    in the set before it.

    Raises ValueError if the relations are cyclic.  The reported set
    contains every element that could not be placed, i.e. the members of
    cycles and anything that can only be reached through one.
    """
    from collections import defaultdict
    succs = defaultdict(set)    # element -> set of direct successors
    npreds = defaultdict(int)   # element -> number of distinct predecessors
    allelts = set()

    for r in relations:
        first = True
        u = None
        for v in r:
            allelts.add(v)
            # Count each distinct u -> v edge once, however often it repeats.
            if not first and v not in succs[u]:
                succs[u].add(v)
                npreds[v] += 1
            first = False
            u = v

    # npreds only gains a key when an element receives a predecessor, so
    # the elements absent from it are exactly the starting chunk.
    nopreds = {u for u in allelts if u not in npreds}

    result = []
    while nopreds:
        result.append(nopreds)
        allelts -= nopreds
        next_nopreds = set()
        for u in nopreds:
            for v in succs[u]:
                npreds[v] -= 1
                assert npreds[v] >= 0
                if npreds[v] == 0:
                    next_nopreds.add(v)
        nopreds = next_nopreds
    if allelts:
        raise ValueError("elements in cycles %s" % allelts)
    return result

然后，例如

>>> chunked_topsort([('a', 'c'), ('b', 'c'), ('b', 'd', 'e')])
[{'a', 'b'}, {'c', 'd'}, {'e'}]

希望有帮助。注意这里没有任何形式的搜索（例如，没有带条件的列表推导式）。因此，从理论上讲，它是高效的。

稍后：计时

在按照您文章末尾的方式生成的测试数据上，chunked_topsort()对输入的顺序几乎不敏感。这并不奇怪，因为该算法只遍历输入一次，用来构建其（本质上无序的）dict和set。总的来说，它比Version B快15到20倍。3次运行的典型计时输出：

worst chunked  0.007 B  0.129 B/chunked  19.79
best  chunked  0.007 B  0.110 B/chunked  16.85
avg   chunked  0.006 B  0.118 B/chunked  19.06

worst chunked  0.007 B  0.127 B/chunked  18.25
best  chunked  0.006 B  0.103 B/chunked  17.16
avg   chunked  0.006 B  0.119 B/chunked  18.86

worst chunked  0.007 B  0.132 B/chunked  20.20
best  chunked  0.007 B  0.105 B/chunked  16.04
avg   chunked  0.007 B  0.113 B/chunked  17.32

使用更简单的数据结构

看来问题已经改变了 ;-)，这里有一个重写版本，它假设输入是range(n)中的整数，并且n也作为参数传入。在对输入关系进行初始遍历之后，不再使用集合和dict，也没有动态分配。在Python中，它在测试数据上比chunked_topsort()快大约40%。但是我太老了，不想再和C++搏斗了 ;-)

def ct_special(relations, n):
    """Layered topological sort for integer elements in range(n).

    `relations` is an iterable producing relations.  A relation is an
    iterable, interpreted to mean
    relation[0] < relation[1] < relation[2] < ...
    All elements must be integers in range(n).  Empty relations are
    ignored.

    Returns a list of length n such that result[i] is the ordinal
    assigned to i, or -1 if i didn't appear in the relations.

    Raises ValueError if an element is outside range(n) or if the
    relations are cyclic.
    """
    # range() rather than the Python 2-only xrange() so this runs on
    # Python 3 as well.
    succs = [[] for _ in range(n)]
    npreds = [-1] * n    # -1 means "never seen", otherwise predecessor count
    nopreds = [-1] * n   # preallocated queue of elements ready to be placed
    numnopreds = 0       # number of queue slots filled so far

    def add_elt(u):
        if not 0 <= u < n:
            raise ValueError("element %s out of range" % u)
        if npreds[u] < 0:
            npreds[u] = 0

    for r in relations:
        u = None   # no predecessor yet; elements are ints, so None is safe
        for v in r:
            add_elt(v)
            if u is not None:
                # Repeated edges are stored and counted every time, which
                # keeps succs and npreds consistent with each other.
                succs[u].append(v)
                npreds[v] += 1
            u = v

    result = [-1] * n
    for u in range(n):
        if npreds[u] == 0:
            nopreds[numnopreds] = u
            numnopreds += 1

    ordinal = nopreds_start = 0
    while nopreds_start < numnopreds:
        # Slots [nopreds_start, numnopreds) form the current chunk; anything
        # appended while processing it belongs to the next chunk.
        next_nopreds_start = numnopreds
        for i in range(nopreds_start, numnopreds):
            u = nopreds[i]
            result[u] = ordinal
            for v in succs[u]:
                npreds[v] -= 1
                assert npreds[v] >= 0
                if npreds[v] == 0:
                    nopreds[numnopreds] = v
                    numnopreds += 1
        nopreds_start = next_nopreds_start
        ordinal += 1
    if any(count > 0 for count in npreds):
        raise ValueError("elements in cycles")
    return result

在Python中，这个版本同样对输入顺序不敏感。

稍后：计时

使用更简单的数据结构

相关问题更多 >

编程相关推荐

热门问题

热门文章