缓存应用中Redis与磁盘的性能比较

import redis
import time


def load_file(fp, fpKey, r, expiry):
    """Read the file at ``fp`` and store its bytes in Redis under ``fpKey``.

    The SET and EXPIRE commands are queued on one pipeline and sent together
    by ``execute()``. Returns the bytes that were read from disk.
    """
    with open(fp, "rb") as f:
        data = f.read()
    p = r.pipeline()
    p.set(fpKey, data)
    p.expire(fpKey, expiry)
    p.execute()
    return data


# NOTE(review): the default ``r`` is evaluated once, when the function is
# defined, so every call that omits ``r`` shares that single client object.
def cache_or_get_gen(fp, expiry=300, r=redis.Redis(db=5)):
    """Endless generator yielding the contents of ``fp``.

    First yields the result of ``load_file`` (which also writes the Redis
    key), then yields ``r.get(fpKey)`` until ``expiry`` seconds have passed
    since that load, then loads from disk again. Each cached yield is a
    single Redis command.
    """
    fpKey = "cached:"+fp
    while True:
        yield load_file(fp, fpKey, r, expiry)
        t = time.time()
        # Serve from Redis until the locally tracked expiry window elapses.
        while time.time() - t - expiry < 0:
            yield r.get(fpKey)


# NOTE(review): same definition-time default for ``r`` as cache_or_get_gen.
def cache_or_get(fp, expiry=300, r=redis.Redis(db=5)):
    """Return the contents of ``fp``, from Redis if the key exists.

    On a hit this issues two Redis commands (EXISTS, then GET). On a miss it
    reads the file, stores it with an expiry through a pipeline (the same
    steps as ``load_file``), and returns the bytes read.
    """
    fpKey = "cached:"+fp
    if r.exists(fpKey):
        return r.get(fpKey)
    else:
        with open(fp, "rb") as f:
            data = f.read()
        p = r.pipeline()
        p.set(fpKey, data)
        p.expire(fpKey, expiry)
        p.execute()
        return data


def mem_cache(fp):
    """Endless generator that reads ``fp`` once and yields the same list.

    Unlike the other readers this uses ``readlines()``, so the yielded value
    is a list of lines rather than a single bytes object.
    """
    with open(fp, "rb") as f:
        data = f.readlines()
    while True:
        yield data


def stressTest(fp, trials = 10000):
    """Time ``trials`` reads of ``fp`` with each strategy and print the rates.

    Each rate is ``trials / elapsed seconds``. The percentage printed next to
    a rate is its relative difference from the plain file-read rate.
    Uses Python 2 ``print`` statements.
    """
    # Read the file x number of times
    a = time.time()
    for x in range(trials):
        with open(fp, "rb") as f:
            data = f.read()
    b = time.time()
    readAvg = trials/(b-a)

    # Generator version

    # Read the file, cache it, read it with a new instance each time
    # NOTE(review): this uses the default client (db=5) created at definition
    # time; no new client object is constructed inside this loop.
    a = time.time()
    gen = cache_or_get_gen(fp)
    for x in range(trials):
        data = next(gen)
    b = time.time()
    cachedAvgGen = trials/(b-a)

    # Read file, cache it, pass in redis instance each time
    # (an explicit client on db=6 is created once, before the loop)
    a = time.time()
    r = redis.Redis(db=6)
    gen = cache_or_get_gen(fp, r=r)
    for x in range(trials):
        data = next(gen)
    b = time.time()
    inCachedAvgGen = trials/(b-a)

    # Non generator version

    # Read the file, cache it, read it with a new instance each time
    # NOTE(review): as above, the shared default client (db=5) is used.
    a = time.time()
    for x in range(trials):
        data = cache_or_get(fp)
    b = time.time()
    cachedAvg = trials/(b-a)

    # Read file, cache it, pass in redis instance each time
    a = time.time()
    r = redis.Redis(db=6)
    for x in range(trials):
        data = cache_or_get(fp, r=r)
    b = time.time()
    inCachedAvg = trials/(b-a)

    # Read file, cache it in python object
    # NOTE(review): mem_cache is a generator function and next() is never
    # called on its result, so each iteration only creates a new generator
    # object; the file is not opened or read inside this loop.
    a = time.time()
    for x in range(trials):
        data = mem_cache(fp)
    b = time.time()
    memCachedAvg = trials/(b-a)

    print "\n%s file reads: %.2f reads/second\n" %(trials, readAvg)
    print "Yielding from generators for data:"
    print "multi redis instance: %.2f reads/second (%.2f percent)" %(cachedAvgGen, (100*(cachedAvgGen-readAvg)/(readAvg)))
    print "single redis instance: %.2f reads/second (%.2f percent)" %(inCachedAvgGen, (100*(inCachedAvgGen-readAvg)/(readAvg)))
    print "Function calls to get data:"
    print "multi redis instance: %.2f reads/second (%.2f percent)" %(cachedAvg, (100*(cachedAvg-readAvg)/(readAvg)))
    print "single redis instance: %.2f reads/second (%.2f percent)" %(inCachedAvg, (100*(inCachedAvg-readAvg)/(readAvg)))
    print "python cached object: %.2f reads/second (%.2f percent)" %(memCachedAvg, (100*(memCachedAvg-readAvg)/(readAvg)))


if __name__ == "__main__":
    fileToRead = "templates/index.html"
    stressTest(fileToRead)

10000 file reads: 30971.94 reads/second Yielding from generators for data: multi redis instance: 8489.28 reads/second (-72.59 percent) single redis instance: 8801.73 reads/second (-71.58 percent) Function calls to get data: multi redis instance: 5396.81 reads/second (-82.58 percent) single redis instance: 5419.19 reads/second (-82.50 percent) python cached object: 1522765.03 reads/second (4816.60 percent)

if r.exists(fpKey): data = r.get(fpKey) Function calls to get data using r.exists as test multi redis instance: 5320.51 reads/second (-82.34 percent) single redis instance: 5308.33 reads/second (-82.38 percent) python cached object: 1494123.68 reads/second (5348.17 percent) Function calls to get data using if data as test multi redis instance: 8540.91 reads/second (-71.25 percent) single redis instance: 7888.24 reads/second (-73.45 percent) python cached object: 1520226.17 reads/second (5132.01 percent)

Total number of files: 700 10000 file reads: 274.28 reads/second Yielding from generators for data: multi redis instance: 15393.30 reads/second (5512.32 percent) single redis instance: 13228.62 reads/second (4723.09 percent) Function calls to get data: multi redis instance: 11213.54 reads/second (3988.40 percent) single redis instance: 14420.15 reads/second (5157.52 percent) python cached object: 607649.98 reads/second (221446.26 percent)

Total number of files: 700 40000 file reads: 1168.23 reads/second Yielding from generators for data: multi redis instance: 14900.80 reads/second (1175.50 percent) single redis instance: 14318.28 reads/second (1125.64 percent) Function calls to get data: multi redis instance: 13563.36 reads/second (1061.02 percent) single redis instance: 13486.05 reads/second (1054.40 percent) python cached object: 587785.35 reads/second (50214.25 percent)

Total number of files: 700 10000 file reads: 284.48 reads/second Yielding from generators for data: single redis instance: 11627.56 reads/second (3987.36 percent) Function calls to get data: single redis instance: 14615.83 reads/second (5037.81 percent) python cached object: 580285.56 reads/second (203884.21 percent)

1条回答

网友

1楼 · 发布于 2024-05-14 10:47:57

这是一个苹果对桔子的比较。见http://redis.io/topics/benchmarks

Redis是一种高效的远程数据存储。每次在Redis上执行命令时，都会向Redis服务器发送一条消息；如果客户端是同步的，它会阻塞并等待回复。因此，除了命令本身的开销之外，您还要付出一次网络往返或IPC（进程间通信）的开销。

在现代硬件上，与其他操作相比，网络往返或ipc的成本高得惊人。这是由以下几个因素造成的：

传输介质的原始延迟（主要针对网络）
操作系统调度器的延迟（在Linux/Unix上没有保证）
内存缓存未命中的代价很高，而当客户端和服务器进程被调度换入/换出时，缓存未命中的概率会增加。
在高端机器上，还有NUMA带来的副作用

现在，让我们回顾一下结果。

比较使用生成器和使用函数调用的两种实现，它们产生的Redis往返次数不同。使用生成器时，您只有：

    while time.time() - t - expiry < 0:
        yield r.get(fpKey)

每次迭代只有1次往返。使用函数时，您有：

if r.exists(fpKey):
    return r.get(fpKey)

每次迭代2次往返。难怪生成器更快。

当然，为了获得最佳性能，您应该重用同一个Redis连接。运行一个每次都要连接/断开连接的基准测试是没有意义的。

最后，关于Redis调用和文件读取之间的性能差异：您只不过是在拿本地调用与远程调用作比较。文件读取会被操作系统的文件系统缓存，因此它们只是内核与Python之间快速的内存传输操作，这里并不涉及磁盘I/O。而使用Redis时，您必须付出往返的开销，因此速度要慢得多。

相关问题更多 >

编程相关推荐

热门问题

热门文章