Update 网络收集.py

This commit is contained in:
frxz751113
2024-09-24 23:16:02 +08:00
committed by GitHub
parent 7de71d46d7
commit 8635e4329a
+3 -3
View File
@@ -361,7 +361,7 @@ with open('2.txt', 'r', encoding='utf-8') as file:
lines = file.readlines() lines = file.readlines()
# 创建或打开一个输出文件用于写入处理后的数据 # 创建或打开一个输出文件用于写入处理后的数据
with open('2.txt', 'w', encoding='utf-8') as outfile: with open('校对文件.txt', 'w', encoding='utf-8') as outfile:
for line in lines: for line in lines:
# 首先检查行是否包含任何提取关键词 # 首先检查行是否包含任何提取关键词
if any(keyword in line for keyword in extract_keywords): if any(keyword in line for keyword in extract_keywords):
@@ -411,7 +411,7 @@ def parse_file(input_file_path, output_file_name):
output_file.write(line + '\n') output_file.write(line + '\n')
output_file.write('\n') # 在每个小段后添加一个空行作为分隔 output_file.write('\n') # 在每个小段后添加一个空行作为分隔
# 调用函数并传入文件路径和输出文件名 # 调用函数并传入文件路径和输出文件名
parse_file('2.txt', '2.txt') parse_file('校对文件.txt', '校对文件.txt')
@@ -421,7 +421,7 @@ from tqdm import tqdm
import os import os
# 存储文件路径 # 存储文件路径
file_path = "2.txt" file_path = "校对文件.txt"
output_file_path = "网络收集.txt" output_file_path = "网络收集.txt"
def get_ip_key(url): def get_ip_key(url):