Update 一锅烩.py
This commit is contained in:
@@ -254,24 +254,22 @@ if __name__ == "__main__":
|
||||
print(f"文件已过滤完成")
|
||||
|
||||
|
||||
#################文本排序
|
||||
# 打开原始文件读取内容,并写入新文件
|
||||
with open('2.txt', 'r', encoding='utf-8') as file:
|
||||
import re
|
||||
from pypinyin import lazy_pinyin
|
||||
# 打开一个utf-8编码的文本文件
|
||||
with open("2.txt", "r", encoding="utf-8") as file:
|
||||
# 读取所有行并存储到列表中
|
||||
lines = file.readlines()
|
||||
# 定义一个函数,用于提取每行的第一个数字
|
||||
# 定义一个函数,用于提取每行的第一个数字
|
||||
def extract_first_number(line):
|
||||
match = re.search(r'\d+', line)
|
||||
return int(match.group()) if match else float('inf')
|
||||
# 对列表中的行进行排序
|
||||
# 按照第一个数字的大小排列,如果不存在数字则按中文拼音排序
|
||||
# 对列表中的行进行排序,按照第一个数字的大小排列,其余行按中文排序
|
||||
sorted_lines = sorted(lines, key=lambda x: (not 'CCTV' in x, extract_first_number(x) if 'CCTV' in x else lazy_pinyin(x.strip())))
|
||||
# 将排序后的行写入新的utf-8编码的文本文件,文件名基于原文件名
|
||||
output_file_path = "sorted_" + os.path.basename(file_path)
|
||||
# 写入新文件
|
||||
with open('2.txt', "w", encoding="utf-8") as file:
|
||||
# 将排序后的行写入新的utf-8编码的文本文件
|
||||
with open("2.txt", "w", encoding="utf-8") as file:
|
||||
for line in sorted_lines:
|
||||
file.write(line)
|
||||
print(f"文件已排序并保存为: {output_file_path}")
|
||||
|
||||
|
||||
|
||||
|
||||
Reference in New Issue
Block a user