Update 一锅烩.py

2024-08-26 10:57:56 +08:00
parent 345cca0eac
commit 97a0494e63
1 changed files with 9 additions and 11 deletions
@@ -254,24 +254,22 @@ if __name__ == "__main__":
 print(f"文件已过滤完成")


-#################文本排序
-# 打开原始文件读取内容,并写入新文件
-with open('2.txt', 'r', encoding='utf-8') as file:
+import re
+from pypinyin import lazy_pinyin
+# 打开一个utf-8编码的文本文件
+with open("2.txt", "r", encoding="utf-8") as file:
+    # 读取所有行并存储到列表中
    lines = file.readlines()
-# 定义一个函数,用于提取每行的第一个数字
+# 定义一个函数，用于提取每行的第一个数字
 def extract_first_number(line):
    match = re.search(r'\d+', line)
    return int(match.group()) if match else float('inf')
-# 对列表中的行进行排序
-# 按照第一个数字的大小排列,如果不存在数字则按中文拼音排序
+# 对列表中的行进行排序，按照第一个数字的大小排列，其余行按中文排序
 sorted_lines = sorted(lines, key=lambda x: (not 'CCTV' in x, extract_first_number(x) if 'CCTV' in x else lazy_pinyin(x.strip())))
-# 将排序后的行写入新的utf-8编码的文本文件,文件名基于原文件名
-output_file_path = "sorted_" + os.path.basename(file_path)
-# 写入新文件
-with open('2.txt', "w", encoding="utf-8") as file:
+# 将排序后的行写入新的utf-8编码的文本文件
+with open("2.txt", "w", encoding="utf-8") as file:
    for line in sorted_lines:
        file.write(line)
-print(f"文件已排序并保存为: {output_file_path}")