SpacetySliceTools/tools/aceshi.py

41 lines
1.4 KiB
Python

import os
import csv
from collections import Counter
# 获取当前目录下的所有txt文件
folder_path = r'R:\TYSAR-德清院\TYSAR-条带模式(SM)\港口\20250910-不分类\C-人工检查\删除空标注' # 当前文件夹
txt_files = [f for f in os.listdir(folder_path) if f.endswith('.txt')]
print(f"找到 {len(txt_files)} 个txt文件:")
for file in txt_files:
print(f" {file}")
# 提取每个文件名的前50个字符
prefixes = [filename[:50] for filename in txt_files]
# 统计每个前缀出现的次数
prefix_counts = Counter(prefixes)
# 准备要写入CSV的数据
csv_data = [(prefix, count) for prefix, count in prefix_counts.items()]
# 将结果写入CSV文件
csv_filename = r'D:\TYSAR-德清院\unique_file_0919.csv'
with open(csv_filename, 'w', newline='', encoding='utf-8') as csvfile:
writer = csv.writer(csvfile)
writer.writerow(['文件名前50个字符', '重复次数']) # 写入表头
writer.writerows(csv_data)
print(f"\n已将结果保存到 {csv_filename}")
print("\n重复统计详情:")
for prefix, count in csv_data:
print(f" '{prefix}': {count}")
# 显示重复的文件
duplicates = [item for item in csv_data if item[1] > 1]
if duplicates:
print("\n发现的重复文件:")
for prefix, count in duplicates:
print(f" 前缀 '{prefix}' 出现了 {count}")
else:
print("\n未发现重复文件")