This commit is contained in:
guanjihuan 2022-09-14 07:41:37 +08:00
parent 7702fd543f
commit 24e3a2c8bf
2 changed files with 42 additions and 0 deletions

View File

@ -1,3 +1,9 @@
"""
This code is supported by the website: https://www.guanjihuan.com
The newest version of this code is on the web page: https://www.guanjihuan.com/archives/25943
"""
def main():
    """Run `creat_necessary_file` on the hard-coded example directory."""
    # `creat_necessary_file` is defined elsewhere in this file.
    target_dir = 'E:/test'
    creat_necessary_file(target_dir)

View File

@ -0,0 +1,36 @@
"""
This code is supported by the website: https://www.guanjihuan.com
The newest version of this code is on the web page: https://www.guanjihuan.com/archives/26113
"""
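# Only duplicate file names are detected; file contents are not compared.
# Checking both names and contents would require computing file hashes, which is not considered here for now.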
def main():
    """Print the repeated file names found under the hard-coded example directory."""
    search_root = 'E:/test'
    duplicates = find_repeated_file_with_same_filename(search_root)
    print(duplicates)
    # Alternative: call the same-named function from the `guan` package
    # (presumably equivalent -- confirm against that package):
    # import guan
    # duplicates = guan.find_repeated_file_with_same_filename(search_root)
    # print(duplicates)
def find_repeated_file_with_same_filename(directory, num=1000):
    """Find file names that occur more than once anywhere under *directory*.

    Only the base file name is compared; the containing folder and the file
    contents are ignored.

    Args:
        directory: Root folder to walk recursively with ``os.walk``.
        num: Only the ``num`` most frequent file names are considered before
            filtering, as passed to ``Counter.most_common``.

    Returns:
        A list of ``(file_name, count)`` tuples with ``count > 1``, ordered
        from the most to the least frequent name. The list is empty when no
        name is repeated.
    """
    import os
    from collections import Counter

    # Count names directory by directory instead of first collecting every
    # file name into one intermediate list.
    name_counts = Counter()
    for _root, _dirs, files in os.walk(directory):
        name_counts.update(files)

    return [item for item in name_counts.most_common(num) if item[1] > 1]
# Run the demo only when this file is executed as a script, not when imported.
if __name__ == '__main__':
    main()