Update 网络收集.py
This commit is contained in:
+3
-3
@@ -363,15 +363,15 @@ keywords = ['1905', '凤凰卫视', '人间卫视', '亚洲卫视', '香港卫
|
|||||||
excluded_pattern = '|'.join(excluded_keywords)
|
excluded_pattern = '|'.join(excluded_keywords)
|
||||||
# 将关键词列表转换为正则表达式模式
|
# 将关键词列表转换为正则表达式模式
|
||||||
pattern = '|'.join(keywords)
|
pattern = '|'.join(keywords)
|
||||||
with open('2.txt', 'r', encoding='utf-8') as file, open('2.txt', 'w', encoding='utf-8') as 2:
|
with open('2.txt', 'r', encoding='utf-8') as file, open('2.txt', 'w', encoding='utf-8') as a:
|
||||||
#2.write('央视频道,#genre#\n')
|
#a.write('央视频道,#genre#\n')
|
||||||
for line in file:
|
for line in file:
|
||||||
if 'genre' not in line:
|
if 'genre' not in line:
|
||||||
# 使用正则表达式检查该行是否不包含任何排除关键词
|
# 使用正则表达式检查该行是否不包含任何排除关键词
|
||||||
if not re.search(excluded_pattern, line):
|
if not re.search(excluded_pattern, line):
|
||||||
# 如果行中有任意关键字
|
# 如果行中有任意关键字
|
||||||
if re.search(pattern, line):
|
if re.search(pattern, line):
|
||||||
2.write(line)
|
a.write(line)
|
||||||
|
|
||||||
###############################################################
|
###############################################################
|
||||||
import re
|
import re
|
||||||
|
|||||||
Reference in New Issue
Block a user