使用Django模型将JSON数据写入关系数据库的最优雅方法是什么？

class NinjaData(models.Model):
    """A ninja, with optional skills, weapons and a master."""

    id = models.IntegerField(primary_key=True, unique=True)
    name = models.CharField(max_length=60)
    birthdatetime = MyDateTimeField(null=True)
    deathdatetime = MyDateTimeField(null=True)
    # The related models are declared further down, so they are referenced
    # by name (lazy string references) instead of by class object.
    skills = models.ManyToManyField('Skills', null=True)
    weapons = models.ManyToManyField('Weapons', null=True)
    master = models.ForeignKey('Master', null=True)


class Skills(models.Model):
    """A skill a ninja can have."""

    id = models.IntegerField(primary_key=True, unique=True)
    name = models.CharField(max_length=60)
    difficulty = models.IntegerField(null=True)


class Weapons(models.Model):
    """A weapon a ninja can carry."""

    id = models.IntegerField(primary_key=True, unique=True)
    name = models.CharField(max_length=60)
    weight = models.FloatField(null=True)


class Master(models.Model):
    """A ninja's master."""

    id = models.IntegerField(primary_key=True, unique=True)
    name = models.CharField(max_length=60)
    is_awesome = models.NullBooleanField()

{ "id":"1234", "name":"Hitori", "birthdatetime":"11/05/1999 20:30:00", "skills":[ { "id":"3456", "name":"stealth", "difficulty":"2" }, { "id":"678", "name":"karate", "difficulty":"1" } ], "weapons":[ { "id":"878", "name":"shuriken", "weight":"0.2" }, { "id":"574", "name":"katana", "weight":"0.5" } ], "master":{ "id":"4", "name":"Schi fu", "is_awesome":"true" } }

data = json.loads(ninja_json)
ninja = NinjaData.objects.create(id=data['id'], name=data['name'])

if 'weapons' in data:
    for weapon in data['weapons']:
        # get_or_create returns an (object, created) tuple; unpack it so that
        # only the model instance is added to the relation.
        w, _created = Weapons.objects.get_or_create(**weapon)
        ninja.weapons.add(w)

if 'skills' in data:
    ...  # (skipping rest of the code for brevity)

3条回答

网友

1楼 · 编辑于 2024-04-20 02:58:06

我不知道您是否熟悉这个术语，但您基本上要做的是从序列化/string格式（在本例中是JSON）反序列化到Python模型对象中。

我不熟悉用于JSON反序列化的Python库，所以无法推荐或担保其中任何一个；不过，用“Python”、“反序列化”、“JSON”、“object”和“graph”等关键词搜索，可以找到Django关于序列化的文档，以及GitHub上的jsonpickle库。

网友

2楼 · 编辑于 2024-04-20 02:58:06

实际上我也有同样的需求，我编写了一个自定义数据库字段来处理它。只需将以下内容保存在项目的Python模块中（例如，在适当的应用程序中保存一个fields.py文件），然后导入并使用它：

class JSONField(models.TextField):
    """Specialized text field that holds JSON in the database, which is
    represented within Python as (usually) a dictionary.

    Values are serialized with ``json.dumps`` before being stored and parsed
    with ``json.loads`` when converted back to Python.
    """

    # Python 2 style metaclass declaration. In the older Django releases that
    # ship SubfieldBase, it makes attribute assignment go through to_python().
    __metaclass__ = models.SubfieldBase

    def __init__(self, blank=True, default='{}', help_text='Specialized text field that holds JSON in the database, which is represented within Python as (usually) a dictionary.', *args, **kwargs):
        """Set up the field; by default it may be blank and holds ``'{}'``."""
        super(JSONField, self).__init__(*args, blank=blank, default=default, help_text=help_text, **kwargs)

    def get_prep_value(self, value):
        """Return the JSON text to store for ``value``.

        An empty string is stored as JSON ``null``.
        """
        # isinstance (not an exact type() match) so that string subclasses
        # are recognised as strings too.
        if isinstance(value, (str, unicode)) and not value:
            value = None
        return json.dumps(value)

    def formfield(self, form_class=JSONFormField, **kwargs):
        """Return the form field for this model field (JSONFormField by default)."""
        return super(JSONField, self).formfield(form_class=form_class, **kwargs)

    def bound_data(self, data, initial):
        """Return ``data`` serialized as JSON text; ``initial`` is ignored."""
        return json.dumps(data)

    def to_python(self, value):
        """Convert a stored or assigned value into its Python representation.

        Non-string values are returned unchanged. The empty string and the
        literal text ``'NaN'`` become ``None``. Strings that look like
        serialized JSON are parsed; every other string is returned as is.

        Raises:
            ValueError: if a string that looks like JSON fails to parse.
        """
        # Lists, dicts, ints, and booleans are fine as they are.
        if not isinstance(value, (str, unicode)):
            return value

        # Empty strings were intended to be null.
        if not value:
            return None

        # The literal text 'NaN' is treated as null; without this check it
        # would fall through below and be returned as the plain string 'NaN'.
        if value == 'NaN':
            return None

        # Heuristic to tell a "normal" string from serialized JSON: either a
        # bare JSON keyword, or text delimited like an object, array or string.
        looks_like_json = value in ('true', 'false', 'null') or (
            value[0] in ('{', '[', '"') and value[-1] in ('}', ']', '"')
        )
        if not looks_like_json:
            return value

        # Okay, this is a JSON-serialized string.
        return json.loads(value)

几件事。首先，如果您使用的是South，则需要向它解释自定义字段的工作原理：

# Register the custom field with South so its migrations can introspect it.
# The first argument is an empty list and the second is a list of regexes
# matched against the field's dotted path (presumably "no extra rules" —
# confirm against the South docs).
# NOTE(review): the path below is the answer author's project layout; adjust
# it to wherever JSONField lives in your own project.
from south.modelsinspector import add_introspection_rules
add_introspection_rules([], [r'^feedmagnet\.tools\.fields\.models\.JSONField'])

其次，我做了不少工作来确保这个自定义字段在各处都能正常运行，例如在序列化格式与Python对象之间来回转换。但有一个地方它工作得不好：与manage.py dumpdata一起使用时，它会把Python对象强制转换成一个字符串，而不是将其转储为JSON，这并不是您想要的。不过在实际使用中，我发现这只是个小问题。

更多信息请参阅Django文档中关于编写自定义模型字段（writing custom model fields）的部分。

我认为这是最好、也最直接的方法。请注意，我还假设您不需要根据这些数据执行查询——也就是说，您会根据其他条件检索记录，JSON数据只是随记录一并取出。如果需要基于JSON中的某些内容进行查询，请把它单独存成一个真正的SQL字段（并确保为它建立索引！）。

网友

3楼 · 编辑于 2024-04-20 02:58:06

在我看来，放置这段代码最干净的地方是NinjaData模型的自定义管理器：把它写成一个新的管理器方法（例如from_json_string）。

我不认为您应该重写标准的create、get_or_create等方法，因为您要做的事情与它们通常的行为有些不同，让它们保持原样正常工作会更好。

更新： 我意识到我可能在某个时候想要这个，所以我编写了代码，并对一个泛型函数进行了简单的测试。因为它递归地遍历并影响其他模型，所以我不再确定它属于Manager方法，而且可能应该是一个独立的helper函数。

def create_or_update_and_get(model_class, data):
    """Create or update a ``model_class`` row from a dict and return it.

    The instance is looked up by primary key and created if it does not
    exist. Every remaining key that names a model field is then assigned.
    Dict values on foreign keys and list values on many-to-many fields are
    handled by recursing into the related model.

    Args:
        model_class: the Django model class to create or update.
        data: mapping of field name to value; it must contain the model's
            primary key. The mapping is not modified.

    Returns:
        The saved model instance.

    Raises:
        KeyError: if ``data`` has no entry for the model's primary key.
    """
    # Imported locally so the helper is self-contained. This is the import
    # path used by the Django versions that still provide ``field.rel.to``.
    from django.db.models.fields import FieldDoesNotExist

    pk_name = model_class._meta.pk.name
    # Work on a shallow copy so popping the primary key does not mutate the
    # caller's dict (or, on recursion, the nested dicts inside it).
    remaining = dict(data)
    get_or_create_kwargs = {pk_name: remaining.pop(pk_name)}

    try:
        # get
        instance = model_class.objects.get(**get_or_create_kwargs)
    except model_class.DoesNotExist:
        # create
        instance = model_class(**get_or_create_kwargs)

    # update (or finish creating)
    for key, value in remaining.items():
        try:
            field = model_class._meta.get_field(key)
        except FieldDoesNotExist:
            # Keys that do not correspond to a model field are ignored.
            continue
        if isinstance(field, models.ManyToManyField):
            # can't add m2m until parent is saved
            continue
        if isinstance(field, models.ForeignKey) and hasattr(value, 'items'):
            # A nested dict describes the related object: upsert it first.
            value = create_or_update_and_get(field.rel.to, value)
        setattr(instance, key, value)
    instance.save()

    # now add the m2m relations
    for field in model_class._meta.many_to_many:
        related_items = remaining.get(field.name)
        # Only list-like values (anything with ``append``) are treated as
        # collections of related-object dicts.
        if hasattr(related_items, 'append'):
            manager = getattr(instance, field.name)
            for obj in related_items:
                manager.add(create_or_update_and_get(field.rel.to, obj))
    return instance

# for example:
# The standard-library json module replaces django.utils.simplejson, whose
# ``simplejson`` submodule name is not reliably importable.
import json

data = json.loads(ninja_json)
ninja = create_or_update_and_get(NinjaData, data)

相关问题更多 >

编程相关推荐

热门问题

热门文章