python3.7保存_python3.7爬取墨菲定律保存在本地txt
#!/usr/local/bin/python3.7
# -*- coding: utf-8 -*-
# @Time: 2019/07/15
# @Function 獲取在線文本內容
import requests
from bs4 import BeautifulSoup
import re
import codecs
# Index page; getContent() follows the links found in its first <dl> element.
url = 'https://www.shuhaige.com/7518/'

# HTTP headers sent with every request.
header = {
    'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/64.0.3282.140 Safari/537.36',
    'Origin': 'https://www.shuhaige.com',
    'Host': 'www.shuhaige.com',
}

# Proxy servers, keyed by URL scheme.
# requests matches proxies by the bare scheme name ('http' / 'https'); the
# previous keys carried a trailing colon ('http:' / 'https:') and would never
# have matched any request.
# NOTE(review): this mapping is not passed to any request in the visible code.
proxies = {
    'http': 'http://121.232.146.184',
    'https': 'https://144.255.48.197',
}
def getContent():
    """Fetch the index page and save every page it links to as a text file.

    Requests ``url``, takes the anchors inside the first ``<dl>`` element,
    downloads each linked page, and hands the first ``div .content`` match
    of that page to ``saveToTxt`` together with the link text as the title.

    Raises:
        requests.RequestException: on connection failure, timeout, or an
            HTTP error status.
        IndexError: if the index page has no ``<dl>`` element or a linked
            page has no ``div .content`` element.
    """
    # Seconds. Without an explicit timeout requests waits indefinitely.
    timeout = 10

    # A session pools the connection across the many same-host requests.
    with requests.Session() as session:
        session.headers.update(header)

        index_response = session.get(url, timeout=timeout)
        # Fail loudly instead of parsing an error page as if it were the index.
        index_response.raise_for_status()
        index_html = BeautifulSoup(index_response.text, 'html.parser')

        # Only anchors that actually carry an href can be followed.
        for link in index_html.select('dl')[0].select('a[href]'):
            item_url = f'https://www.shuhaige.com{link["href"]}'
            item_response = session.get(item_url, timeout=timeout)
            item_response.raise_for_status()
            item_html = BeautifulSoup(item_response.text, 'html.parser')
            saveToTxt(item_html.select('div .content')[0], link.string)
# Write the collected content to a text file
def saveToTxt(comments, title):
    """Write the items of ``comments`` to ``MoFeiDingLv/<title>.txt`` (UTF-8).

    Each item is converted to its string form, stripped of newline
    characters, and the results are concatenated into one string that
    becomes the file's content. A confirmation line is printed afterwards.

    Args:
        comments: Iterable whose items are rendered with string formatting.
        title: Used as the file name (without extension) and in the
            printed confirmation message.
    """
    import os  # local import: the file's import block does not include os

    # NOTE(review): in the published listing these two literals were broken
    # across physical lines, which is not valid Python. They are restored
    # here as literal newlines, exactly as shown. HTML tags (e.g. a line
    # break tag and a paragraph pattern) were possibly lost when the listing
    # was extracted -- confirm against the original script. As written, the
    # regex can never match because all newlines are already removed.
    pieces = []
    for item in comments:
        comment_info = f'{item}'.replace('\n', '')
        comment_info = re.sub(r'\n.*\n', '', comment_info)
        pieces.append(comment_info)
    text = ''.join(pieces)

    # The output directory is not guaranteed to exist on a fresh checkout.
    os.makedirs('MoFeiDingLv', exist_ok=True)
    with codecs.open(f'MoFeiDingLv/{title}.txt', 'w', encoding='utf-8') as out_file:
        # write(), not writelines(): the payload is a single string.
        out_file.write(text)
    print(f'{title}寫入文件成功!')
# Start scraping only when run as a script, so importing this module
# does not trigger network requests and file writes.
if __name__ == '__main__':
    getContent()
總結
以上是生活随笔為你收集整理的python3.7保存_python3.7爬取墨菲定律保存在本地txt的全部內容,希望文章能夠幫你解決所遇到的問題。
- 上一篇: 柠檬柚子茶的功效与作用、禁忌和食用方法
- 下一篇: 蛇六谷的功效与作用、禁忌和食用方法