计算机视觉

统计数据集标签中目标数量

2025-05-12 1 min read 132 chars
import os

def count_non_empty_lines_in_folder(folder_path):
    """Return the number of non-empty lines across all ``.txt`` files.

    The directory tree rooted at ``folder_path`` is walked recursively with
    ``os.walk``. Only files whose name ends with ``.txt`` (case-sensitive)
    are read, decoded as UTF-8. A line counts as non-empty when it still
    contains at least one character after stripping whitespace.

    Args:
        folder_path: Root directory to scan.

    Returns:
        The total count of non-empty lines found, as an int.
    """
    line_count = 0

    for current_dir, _subdirs, filenames in os.walk(folder_path):
        for name in filenames:
            # Skip anything that is not a .txt file.
            if not name.endswith('.txt'):
                continue

            label_path = os.path.join(current_dir, name)
            with open(label_path, 'r', encoding='utf-8') as handle:
                # Whitespace-only lines strip down to '' and are not counted.
                line_count += sum(1 for raw in handle if raw.strip())

    return line_count

# Paths of the train and test label folders.
train_folder = 'labels/train'
test_folder = 'labels/test'

# Count the non-empty lines in each folder (train first, then test);
# each such line is reported below as one target.
train_lines, test_lines = (
    count_non_empty_lines_in_folder(folder)
    for folder in (train_folder, test_folder)
)

print(f"Train文件夹中目标的总数: {train_lines}")
print(f"Test文件夹中目标的总数: {test_lines}")

Comments.