按多个键对字典列表进行分类
我有一个字典的列表:
# Sample records: each person is a dict with "name", "city", "age" and "sex" keys.
people = [{"name": "Roger", "city": "NY", "age": 20, "sex": "M"},
{"name": "Dan", "city": "Boston", "age": 20, "sex": "M"},
{"name": "Roger", "city": "Boston", "age": 21, "sex": "M"},
{"name": "Dana", "city": "Dallas", "age": 30, "sex": "F"}]
我想给它们分类,比如我选择这些键:
# Keys to classify by, outermost grouping level first.
field = ("sex", "age")
我需要一个函数 catalogue(field, people)
,它能给我:
{ "M":
{ 20: [{"name": "Roger", "city": "NY", "age": 20, "sex": "M"},
{"name": "Dan", "city": "Boston", "age": 20, "sex": "M"}],
21: [{"name": "Roger", "city": "Boston", "age": 21, "sex": "M"}]
},
"F":
{ 30: [{"name": "Dana", "city": "Dallas", "age": 30, "sex": "F"}] }
}
当 len(field)==1
时,这个就简单了。我想做类似这样的事情:
# Walk the two-level catalogue: sex -> age -> list of person dicts.
c = catalogue(field, people)
for sex, by_age in c.items():
    for age, persons in by_age.items():
        # Each leaf is a list of person dicts, so the name has to be read
        # from every person rather than from the list itself.
        for person in persons:
            print("%s %s %s" % (sex, age, person["name"]))
3 个回答
0
import pprint
people = [
    {"name": "Roger", "city": "NY", "age": 20, "sex": "M"},
    {"name": "Dan", "city": "Boston", "age": 20, "sex": "M"},
    {"name": "Roger", "city": "Boston", "age": 21, "sex": "M"},
    {"name": "Dana", "city": "Dallas", "age": 30, "sex": "F"},
]
fields = ("sex", "age")

# Build a nested dict with one level per field; the innermost level maps the
# last field's value to the list of person dicts that share that value.
result = {}
for person in people:
    # Descend one dict level per leading field, creating levels on demand.
    tempdict = result
    for field in fields[:-1]:
        tempdict = tempdict.setdefault(person[field], {})
    # The last field selects the list this person is appended to.
    key = person[fields[-1]]
    tempdict.setdefault(key, []).append(person)

pprint.pprint(result)
看起来能解决问题。
0
这个方法不是最优的(其实可以用 defaultdict
来改进,比如说,但我当时机器上装的是 Python2.4),不过它能完成任务:
def catalogue(dicts, criteria):
    """Group dicts into nested dicts, one nesting level per criterion.

    Args:
        dicts: The records to group; each must contain every key listed in
            ``criteria``.
        criteria: Sequence of keys to group by, outermost level first.

    Returns:
        ``dicts`` itself when ``criteria`` is empty. Otherwise a dict mapping
        each distinct value of the first criterion to the catalogue of the
        matching records under the remaining criteria. Leaf records are
        shallow copies with the grouping keys removed (their values are
        already given by the path); the input dicts are not modified.

    Raises:
        KeyError: If a record lacks one of the criteria keys.
    """
    if not criteria:
        return dicts
    criterion, rest = criteria[0], criteria[1:]
    cat = {}
    for d in dicts:
        # Copy before stripping the key so the caller's dict stays intact.
        reduced = dict(d)
        value = reduced.pop(criterion)
        cat.setdefault(value, []).append(reduced)
    # Recurse into every bucket with the remaining criteria.
    return dict((key, catalogue(group, rest)) for key, group in cat.items())
# Show the people grouped by sex, then by age.
print(catalogue(people, ("sex", "age")))
7
递归地:
import itertools, operator
def catalog(fields, people):
    """Recursively group records into nested dicts, one level per field.

    Args:
        fields: Sequence of keys to group by, outermost level first.
        people: Iterable of dicts; each must contain every key in ``fields``,
            and the values under each key must be sortable and hashable.

    Returns:
        A list of the records when ``fields`` is empty. Otherwise a dict
        mapping each distinct value of ``fields[0]`` to the catalog of the
        matching records under the remaining fields. The leaves are lists
        holding the original record objects, in their input order.

    Raises:
        KeyError: If a record lacks one of the keys in ``fields``.
    """
    if not fields:
        # No grouping levels left: the records themselves are the leaf.
        return list(people)
    cur_field = operator.itemgetter(fields[0])
    # groupby only merges adjacent items, so sort by the same key first;
    # the sort is stable, which keeps the input order inside each group.
    groups = itertools.groupby(sorted(people, key=cur_field), cur_field)
    # Each group iterator is consumed by the recursive call before groupby
    # advances to the next key, which is required for groupby to be valid.
    return dict((k, catalog(fields[1:], v)) for k, v in groups)
测试:
import pprint
# Pretty-print the people grouped by sex, then by age.
pprint.pprint(catalog(('sex','age'), people))
{'F': {30: [{'age': 30, 'city': 'Dallas', 'name': 'Dana', 'sex': 'F'}]},
'M': {20: [{'age': 20, 'city': 'NY', 'name': 'Roger', 'sex': 'M'},
{'age': 20, 'city': 'Boston', 'name': 'Dan', 'sex': 'M'}],
21: [{'age': 21, 'city': 'Boston', 'name': 'Roger', 'sex': 'M'}]}}