Update GAT.py

This commit is contained in:
frxz751113
2024-10-03 03:38:52 +08:00
committed by GitHub
parent 5dda56c5d1
commit 31d5f23ad4
+2 -1
View File
@@ -25,6 +25,7 @@ with open(output_file, 'w', encoding='utf-8') as f:
soup = BeautifulSoup(response.text, 'html.parser') soup = BeautifulSoup(response.text, 'html.parser')
text_content = soup.get_text() text_content = soup.get_text()
f.write(text_content + '\n') f.write(text_content + '\n')
print(f"{keyword}获取完成")
else: else:
print(f'请求 {url} 失败,状态码:{response.status_code}') print(f'请求 {url} 失败,状态码:{response.status_code}')
time.sleep(1) # 添加 1 秒的延迟 time.sleep(1) # 添加 1 秒的延迟
@@ -57,7 +58,7 @@ with open(output_file, 'w', encoding='utf-8') as f:
try: try:
response = requests.get(url) response = requests.get(url)
if response.status_code == 200: if response.status_code == 200:
print(response.content) # 打印响应内容 print(f"{keyword}获取完成") # 打印响应内容
try: try:
soup = BeautifulSoup(response.content, 'html.parser') soup = BeautifulSoup(response.content, 'html.parser')
text_content = soup.get_text() text_content = soup.get_text()