获得以下信息:“5.1 HV:/戴手套的门将不能系鞋带的体育精神,值得尊敬% meets football% football% wonderful进球%意甲% only football is not https://v.douyin.com/ eDFd28P/复制此链接,打开抖音搜索,直接观看视频!” 通过regular获取消息中的地址: share_url='5.1 HV:/ 守门员戴手套没法系鞋带这种体育精神,值得尊敬%遇见足球 %足球 %精彩进球 %意甲 %唯有足球不 https://v.douyin.com/eDFd28P/ 复制此链接,打开Dou音搜索,直接观看视频!'
short_url = re.findall('(https?://[^\s]+)', share_url)[0]
访问该地址以分析返回的数据 访问短连接后,请求的地址将变成如下所示 逐个过滤返回的数据,发现这个连接可以直接访问视频 重组请求的地址以获得源视频的地址: headers = {
"user-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.93 Safari/537.36",
}
# 通过分享连接获取跳转的地址
url = requests.get(url=short_url,headers=headers).url
# 通过跳转的地址找到item_id
item_id = re.findall('https://www.iesdouyin.com/share/video/(\d+)',url)[0]
# 请求地址获取数据
rel_url = requests.get(url="https://www.iesdouyin.com/web/api/v2/aweme/iteminfo/?item_ids="+item_id,headers=headers).text
# 筛出视频地址
video_rul = json.loads(rel_url)['item_list'][0]['video']['play_addr']['url_list'][0]
如何去除水印 视频地址可以通过以上步骤获取:https://aweme.snssdk.com/aweme/v1/playwm/?video_id=v0300fg10000c29ouk4guk3mmkooa0r0&ratio=720p&line=0将playwm替换为play,得到没有水印的地址
video_rul = json.loads(rel_url)['item_list'][0]['video']['play_addr']['url_list'][0].replace('/playwm/', '/play/')
完整代码
import requests
import re
import json
down_load_path = 'E:\下载的MP4\\'
class D_y():
headers = {
"user-agent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/90.0.4430.93 Safari/537.36",
}
def __init__(self,share_url):
self.share_url = share_url
def get_rel_url(self):
# short_url = re.findall('(https?://[^\s]+)', self.share_url)[0]
short_url = re.findall('(http[|s]?://[^\s]*/)', self.share_url)[0]
url = requests.get(url=short_url, headers=self.headers).url
# item_id = re.findall('https://www.iesdouyin.com/share/video/(\d+)', url)[0]
item_id = url.split('/')[5]
rel_url = requests.get(url="https://www.iesdouyin.com/web/api/v2/aweme/iteminfo/?item_ids=" + item_id,headers=self.headers).text
video_rul = json.loads(rel_url)['item_list'][0]['video']['play_addr']['url_list'][0].replace('/playwm/','/play/')
video = requests.get(url=video_rul,headers=self.headers).content
video_name = json.loads(rel_url)['item_list'][0]['share_info']['share_title'].split('#')[0].split('@')[0].replace(' ','')
if not os.path.exists(down_load_path):
os.mkdir(down_load_path)
with open(down_load_path+str(video_name)+'.mp4','wb') as f:
f.write(video)
f.close()
print("【抖音短视频】: {}.mp4 无水印视频下载完成!".format(video_name))
if __name__ == '__main__':
a = input("url:")
D_y(a).get_rel_url()
|