Python：比较不同文件名的两个目录

from collections import Counter

# Define the lists which contain the filenames to compare
originals = "orig-files.txt"
next_step_filenames = "new-files.txt"


def read_input_file(input_filename):
    """Return the lines of *input_filename* as a list, newlines included."""
    # ``with`` closes the file even if reading raises.
    with open(input_filename, 'r') as f:
        return f.readlines()


def files_missing_outputs(original_names, next_step_names, expected=3):
    """Return the original names that have fewer than *expected* outputs.

    Each entry of *next_step_names* is taken to be an original name followed
    by a ``-<number>`` suffix; the text after the last ``-`` is dropped and
    the remainder is matched exactly against the original names.

    Args:
        original_names: Iterable of original names; surrounding whitespace
            (including a trailing newline) is ignored, blank entries skipped.
        next_step_names: Iterable of generated names, handled the same way.
        expected: Number of generated names each original should have.

    Returns:
        The stripped original names, in input order, whose number of matching
        generated names is below *expected*.
    """
    # Count once up front instead of rescanning the list for every original.
    # Exact matching on the stripped prefix avoids substring false positives
    # such as 'xa1' matching 'xa10-1'.
    produced = Counter(
        name.strip().rsplit('-', 1)[0]
        for name in next_step_names
        if name.strip()
    )
    stripped = (name.strip() for name in original_names)
    # A Counter reports 0 for names it never saw, so originals with no
    # generated files at all are included.
    return [name for name in stripped if name and produced[name] < expected]


if __name__ == "__main__":
    # Read the files with filenames and without extensions
    original_files = read_input_file(originals)
    next_step_files = read_input_file(next_step_filenames)

    # List of files which generated fewer than 3 files
    Final_list = files_missing_outputs(original_files, next_step_files)
    for b in Final_list:
        print(b)

2条回答

网友

1楼 · 编辑于 2024-04-20 04:02:14

下面是一个实现：

def updateHash(d, key):
    """Update the tally stored for *key* in the mapping *d*, in place.

    A key that is already present has its value lowered by one; a key seen
    for the first time is stored with the value 3. Nothing is returned.
    """
    if key in d:
        d[key] -= 1
        return
    # First time this key is seen.
    d[key] = 3

# Listing files: one name per line.
originals = "orig-files.txt"
next_step_filenames = "new-files.txt"

with open(originals, 'r') as f:
    originals_list = f.read().splitlines()

with open(next_step_filenames, 'r') as f:
    next_step_list = f.read().splitlines()

# Only membership is tested below, so look names up in a set rather than
# scanning the list three times per original.
next_step_names = set(next_step_list)

# For every original name, call updateHash once per expected '-1'/'-2'/'-3'
# variant that is absent from the next-step listing. Originals with all three
# variants present never appear in d.
d = {}
for orig in originals_list:
    for suffix in ('-1', '-2', '-3'):
        if orig + suffix not in next_step_names:
            updateHash(d, orig)

# print() as a function call is valid on both Python 2 and Python 3.
print(d)

网友

2楼 · 编辑于 2024-04-20 04:02:14

使用 Counter 统计 next_step_files_trimmed 中每个文件名去掉最后 2 个字符（即“-N”后缀）后的出现次数。得到的 Counter 对象可用于过滤 original_files_trimmed，只保留计数少于 3 的项。

示例：

from collections import Counter

# Sample data: the original names ...
original_files_trimmed = [
    'xa02-1-1-1-1',
    'xa02-1-1-1-2',
    'xa02-1-1-2-3',
    'xa02-1-3-3-3',
    'xa06-3-1-2-1',
    'xa07-1-2-1-1',
]
# ... and the next-step names, each an original name plus a two-character
# '-N' suffix.
next_step_files_trimmed = [
    'xa02-1-1-1-1-1',
    'xa02-1-1-1-1-2',
    'xa02-1-1-1-1-3',
    'xa02-1-1-1-2-1',
    'xa02-1-1-1-2-2',
    'xa02-1-1-1-2-3',
    'xa02-1-1-2-3-1',
    'xa02-1-3-3-3-1',
    'xa02-1-3-3-3-2',
    'xa06-3-1-2-1-1',
    'xa06-3-1-2-1-2',
    'xa06-3-1-2-1-3',
]

# Drop the last two characters of every next-step name and tally how often
# each remaining prefix occurs.
next_step_files_without_num = (name[:-2] for name in next_step_files_trimmed)
next_step_files_without_num_cnt = Counter()
next_step_files_without_num_cnt.update(next_step_files_without_num)

# Keep the originals whose tally is below 3; a Counter yields 0 for a prefix
# it never saw, so originals with no next-step names are kept as well.
final_list = list(filter(
    lambda original: next_step_files_without_num_cnt[original] < 3,
    original_files_trimmed,
))

print(final_list)

示例：

相关问题更多 >

编程相关推荐

热门问题

热门文章