python抓取视频真实地址_快手批量获取真实地址python
import requests
from bs4 import BeautifulSoup
import re
import xlrd
import xlwt
class KSNoMark:
    """Resolve Kuaishou share links from a spreadsheet into "srcNoMark" video URLs.

    Share links are read from the first column of an Excel sheet (skipping
    the header row); each one is resolved over HTTP and the
    (share link, resolved address) pairs are written to an .xls workbook.
    """

    # Silence urllib3 warnings; the requests below are sent with verify=False.
    # NOTE(review): verify=False disables TLS certificate verification.
    # It is kept to preserve the original behavior - confirm it is intended.
    requests.packages.urllib3.disable_warnings()

    # Mobile Safari User-Agent and a fixed cookie sent with every request.
    HEADERS = {
        'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 13_2_3 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/13.0.3 Mobile/15E148 Safari/604.1',
        'Cookie': 'did=web_e4581e2dbe33aae5eac3d9fdf8b12566;',
    }

    # Extracts the "srcNoMark" value from the page-data string; compiled once
    # instead of once per URL.
    SRC_NO_MARK_PATTERN = re.compile(r'"srcNoMark":"(.*?)"},', re.S)

    # Seconds to wait for each HTTP request so a stalled server cannot hang
    # the whole batch.
    REQUEST_TIMEOUT = 10

    def GetShareUrl(self, path='分享鏈接.xlsx', sheet_name='url'):
        """Return the share links listed in the first column of the sheet.

        Args:
            path: Workbook to read.
            sheet_name: Name of the sheet holding the links.

        Returns:
            A list of non-blank link strings taken from rows 2..n of column 1
            (row 1 is treated as a header), with surrounding whitespace
            removed. Non-text cells are skipped. An empty list is returned
            when the workbook or sheet cannot be opened.
        """
        # NOTE(review): xlrd 2.0+ reportedly no longer reads .xlsx files -
        # confirm the installed xlrd version supports this workbook format.
        try:
            workbook = xlrd.open_workbook(path)
            sheet = workbook.sheet_by_name(sheet_name)
        except FileNotFoundError:
            print("{}文件不存在".format(path))
            return []
        except xlrd.XLRDError as e:
            # Raised for an unsupported file format or a missing sheet.
            print(e)
            return []

        cells = (sheet.cell_value(row, 0) for row in range(1, sheet.nrows))
        return [
            cell.strip()
            for cell in cells
            if isinstance(cell, str) and cell.strip()
        ]

    def GetRealUrl(self, output_path='快手視頻真實(shí)地址.xls'):
        """Resolve every share link and save the results to a workbook.

        Column 1 of the 'realLinks' sheet receives the share link and
        column 2 the resolved address. A link that cannot be resolved is
        reported on stdout and its second column is left empty; the remaining
        links are still processed. Nothing is written when there are no links.

        Args:
            output_path: Destination .xls file.
        """
        # NOTE(review): the "(shí)" in the default file name looks like a
        # text-extraction artifact - confirm the intended name before
        # changing it, since callers may rely on the current path.
        urls = self.GetShareUrl()
        if not urls:
            return

        workbook = xlwt.Workbook(encoding='utf-8')
        worksheet = workbook.add_sheet('realLinks')
        try:
            for row_num, url in enumerate(urls):
                worksheet.write(row_num, 0, url)
                try:
                    real_url = self._resolve_real_url(url)
                except (requests.RequestException, ValueError) as e:
                    # Best effort: report the failure and move on.
                    print(e)
                    continue
                worksheet.write(row_num, 1, real_url)
        finally:
            # Save once, and keep rows gathered so far even if the loop is
            # interrupted.
            workbook.save(output_path)

    def _resolve_real_url(self, url):
        """Return the "srcNoMark" address for one share link.

        Raises:
            requests.RequestException: If an HTTP request fails or times out.
            ValueError: If the redirect target, the page-data element or the
                "srcNoMark" entry is missing.
        """
        # The share link answers with a redirect; read its target instead of
        # following it automatically.
        response = requests.get(
            url,
            headers=self.HEADERS,
            allow_redirects=False,
            verify=False,
            timeout=self.REQUEST_TIMEOUT,
        )
        share_url = response.headers.get('Location')
        if not share_url:
            raise ValueError('no redirect Location returned for {}'.format(url))

        page = requests.get(
            share_url,
            headers=self.HEADERS,
            verify=False,
            timeout=self.REQUEST_TIMEOUT,
        ).text

        # The page data is stored in an attribute of the element whose id is
        # "hide-pagedata".
        soup = BeautifulSoup(page, 'lxml')
        node = soup.find(attrs={'id': 'hide-pagedata'})
        page_data = node.attrs.get('data-pagedata') if node is not None else None
        if not page_data:
            raise ValueError('no hide-pagedata element found for {}'.format(url))

        match = self.SRC_NO_MARK_PATTERN.search(page_data)
        if match is None:
            raise ValueError('no srcNoMark entry found for {}'.format(url))
        return match.group(1)
if __name__ == '__main__':
    # Script entry point: resolve all share links, then report completion.
    # A separate variable name keeps the KSNoMark class itself accessible
    # instead of rebinding it to an instance.
    scraper = KSNoMark()
    scraper.GetRealUrl()
    print("快手真實(shí)地址采集完成")
表格名稱:分享鏈接.xlsx
sheet名稱:url
第一列第一行:分享鏈接
第一列 第2-n行:需要解析的分享視頻地址
總結
以上是生活随笔為你收集整理的python抓取视频真实地址_快手批量获取真实地址python的全部內容,希望文章能夠幫你解決所遇到的問題。
- 上一篇: CSS3动画animation认识和An
- 下一篇: java积累(一)------后端---