在python中递归查找目录中文件的md5

import hashlib
import os
import sys


def _md5_of_file(path, chunk_size=65536):
    """Return the hexadecimal MD5 digest of the file at *path*.

    The file is opened in binary mode and read in chunks of *chunk_size*
    bytes, so large files are never loaded into memory all at once.
    """
    hasher = hashlib.md5()
    with open(path, 'rb') as afile:
        buf = afile.read(chunk_size)
        while buf:
            hasher.update(buf)
            buf = afile.read(chunk_size)
    return hasher.hexdigest()


def print_files(file_directory, file_extensions=('10',)):
    """Print the path and MD5 of matching files in file_directory, recursively.

    A file matches when its name starts with one of the strings in
    *file_extensions* (despite the parameter name these are checked as name
    prefixes) and its name is exactly 19 characters long. For every match the
    attribute ``print_files.counter`` is incremented by one, and the full
    path, the MD5 hex digest, and a blank separator are printed.

    Parameters:
        file_directory: directory to scan; converted to an absolute path.
        file_extensions: iterable of name prefixes to look for.

    Returns:
        None. Results are written to standard output.
    """
    file_directory = os.path.abspath(file_directory)
    # str.startswith accepts a tuple, so a file is reported once even when
    # several prefixes match it.
    prefixes = tuple(file_extensions)

    for filename in os.listdir(file_directory):
        filepath = os.path.join(file_directory, filename)

        if os.path.isfile(filepath):
            # Not a required file, ignore it.
            if not filename.startswith(prefixes) or len(filename) != 19:
                continue

            # We have got a matching file!
            print_files.counter += 1

            # Hash the full path, not the bare name: the bare name only
            # resolves when the file happens to live in the current
            # working directory.
            print('{0}'.format(filepath))
            print(_md5_of_file(filepath))
            print('\n')
        elif os.path.isdir(filepath):
            # We got a directory: descend into it with the same prefixes.
            print_files(filepath, file_extensions)


# Number of matching files seen so far. Initialised here so print_files()
# can also be called when this file is imported rather than run as a script.
print_files.counter = 0


if __name__ == '__main__':
    # Directory argument supplied
    if len(sys.argv) == 2:
        if os.path.isdir(sys.argv[1]):
            file_directory = sys.argv[1]
        else:
            print('ERROR: "{0}" is not a directory.'.format(sys.argv[1]))
            sys.exit(1)
    else:
        # Set file directory to CWD
        file_directory = os.getcwd()

    print('\n -- Looking for Required Files in "{0}" -- \n'.format(file_directory))

    # Set the number of processed files equal to zero
    print_files.counter = 0

    # Start Processing
    print_files(file_directory)

    # We are done. Exit now.

3条回答

网友

1楼 · 编辑于 2024-05-23 17:01:49

用下面这行代码解决了问题：

# Read the file in binary mode so the digest covers the exact bytes on disk,
# and let the with-block close the handle once hashing is done.
with open(filepath, 'rb') as afile:
    print(hashlib.md5(afile.read()).hexdigest())

我之前并没有读取文件内容，只是把文件路径直接传给了 hashlib.md5。感谢 Matt 的指点。

网友

2楼 · 编辑于 2024-05-23 17:01:49

我建议您不要用递归来解决这个问题，而是使用 os.walk() 遍历目录结构。以下代码可以作为 print_files 函数的主体。

file_directory = os.path.abspath(file_directory)
paths_to_hash = []

# os.walk yields each directory under file_directory together with the
# names of the files directly inside it, so no manual recursion is needed.
for root, _dirs, filenames in os.walk(file_directory, topdown=False):
    for filename in filenames:
        # Keep only files whose name starts with '10'.
        if filename.startswith('10'):
            paths_to_hash.append(os.path.join(root, filename))

for path in paths_to_hash:
    # Binary mode hashes the exact bytes on disk; the with-block closes the
    # handle. hexdigest() gives printable hex instead of raw digest bytes.
    with open(path, 'rb') as afile:
        md5_hex = hashlib.md5(afile.read()).hexdigest()
    print('hash: {0} for path: {1}'.format(md5_hex, path))

网友

3楼 · 编辑于 2024-05-23 17:01:49

打印哈希器的行应该是：

# hexdigest() returns the accumulated MD5 as a hexadecimal string.
print(hasher.hexdigest())

相关问题更多 >

编程相关推荐

热门问题

热门文章