import json
import re
from urllib.parse import unquote, urlsplit

import requests
# Browser-like request headers (desktop Chrome on macOS user agent).
HEADERS = {
    'user-agent': (
        'Mozilla/5.0 (Macintosh; Intel Mac OS X 10_14_3) '
        'AppleWebKit/537.36 (KHTML, like Gecko) '
        'Chrome/74.0.3729.131 Safari/537.36'
    ),
}
'''
Resolve Youku VIP videos through a third-party online parsing service.
'''
class web():
    """Resolve a Youku VIP video page through the mt2t.com parsing service.

    The flow implemented by :meth:`get_playlist` is:

    1. GET the parsing page (``api`` + ``url``) and scrape the ``key`` it embeds.
    2. POST ``url``/``key`` to ``post_url1`` to obtain a JSON list of links.
    3. Decode the first link with :meth:`url_spilt` and POST it to ``post_url2``.
    4. Pass the decoded JSON response to :meth:`save_movie`.

    ``url`` and ``name`` are plain attributes, so one instance can be reused
    for several videos by reassigning them before each call.
    """

    # Seconds to wait on each HTTP call; without an explicit timeout
    # ``requests`` waits indefinitely for an unresponsive server.
    REQUEST_TIMEOUT = 10

    def __init__(self):
        # Online parsing page; the target video URL is appended to it as-is.
        self.api = "http://y.mt2t.com/lines?url="
        # VIP video page to resolve (sample default).
        self.url = "https://v.youku.com/v_show/id_XNDEwNTMzMzM2OA==.html"
        # Base name (without extension) of the file written by save_movie.
        self.name = None
        # Endpoint 1 of the parsing service: returns the candidate video links.
        self.post_url1 = "http://y.mt2t.com/lines/getdata"
        # Endpoint 2 of the parsing service: serves the m3u8 video data.
        self.post_url2 = 'http://y2.mt2t.com:91/ifr/api'

    def find_key(self):
        """Return the ``key`` embedded in the parsing page for ``self.url``.

        The parsing page contains an ajax call whose data looks like
        ``data:{url:"...",type:"",key:"a0b923820dcc509a"}``; the key is
        extracted from that text with a regular expression.

        Raises:
            ValueError: If the page contains no ``key:"..."`` entry.
        """
        res = requests.get(self.api + self.url, timeout=self.REQUEST_TIMEOUT)
        match = re.search(r'key:"(.*?)"', res.text)
        if match is None:
            # The original dereferenced the match unconditionally, which
            # surfaced as an opaque AttributeError on NoneType.
            raise ValueError("no key found in parsing page for %s" % self.url)
        return match.group(1)

    def url_spilt(self, url):
        """Split a link from endpoint 1 into its video address and type.

        Example input::

            http://y2.mt2t.com:91/ifr?url=usZe...%2bgh...GYA%3d%3d&type=m3u8

        yields ``("usZe...+gh...GYA==", "m3u8")``.

        Args:
            url: Link whose query string carries a percent-encoded ``url``
                parameter and, optionally, a ``type`` parameter.

        Returns:
            ``(url_param, movie_type)``: the percent-decoded ``url`` value and
            the ``type`` value, or ``""`` when the link has no ``type``.

        Raises:
            ValueError: If the link has no ``url`` query parameter.
        """
        fields = {}
        for pair in urlsplit(url).query.split("&"):
            field, _, raw = pair.partition("=")
            # partition() splits on the first "=" only, so unencoded base64
            # padding ("==") stays part of the value.
            fields.setdefault(field, raw)
        if "url" not in fields:
            raise ValueError("no 'url' parameter in %r" % url)
        # unquote() (not unquote_plus/parse_qs) keeps a literal "+" intact,
        # which matters because the value is base64 text.
        return unquote(fields["url"]), unquote(fields.get("type", ""))

    def get_playlist(self):
        """Resolve ``self.url`` via the parsing service and save the result.

        Endpoint 1 answers with a JSON list of entries such as::

            [{'Url': 'http://y2.mt2t.com:91/ifr?url=usZe...%3d%3d&type=m3u8',
              'Video_type': '1', 'Vid': None, 'Scheme': 'auto'},
             ...]

        Raises:
            ValueError: If no key can be scraped or endpoint 1 returns no
                entries.
        """
        key = self.find_key()
        form = {
            "url": self.url,
            "key": key,
        }
        # Send url + key to endpoint 1 to obtain the candidate video links.
        html = requests.post(
            self.post_url1, data=form, timeout=self.REQUEST_TIMEOUT
        ).text
        dic = json.loads(html)
        print(dic)
        if not isinstance(dic, list) or not dic:
            raise ValueError(
                "parsing service returned no video links for %s" % self.url
            )
        # Per the original author's notes the first entry (the m3u8 one)
        # carries the complete video, so only that entry is used.
        url_param, _ = self.url_spilt(dic[0]["Url"])
        # Mirrors the page's player(api, url, type, device, 0) ajax call.
        # NOTE(review): "type" is sent empty, as in the original, even though
        # the link carries a type such as "m3u8" -- confirm what the service
        # expects.
        res = requests.post(
            self.post_url2,
            data={
                "url": url_param,
                "type": '',
                "from": "mt2t.com",
                "device": "",
                "up": 0
            },
            timeout=self.REQUEST_TIMEOUT,
        )
        play = json.loads(res.text)
        self.save_movie(play)

    def save_movie(self, play):
        """Write ``play`` to ``<self.name>.mp4``.

        Args:
            play: Data to store. ``bytes``/``bytearray`` are written as-is,
                ``str`` is UTF-8 encoded, and any other JSON-compatible
                object (what :meth:`get_playlist` passes) is serialized as
                JSON text.

        NOTE(review): this stores the service's response, not a video stream;
        TODO confirm the response schema before relying on the ``.mp4`` file.
        """
        # The file is opened in binary mode, so the payload must be bytes;
        # the original passed the decoded JSON object straight to write(),
        # which raised TypeError.
        if isinstance(play, (bytes, bytearray)):
            payload = bytes(play)
        elif isinstance(play, str):
            payload = play.encode("utf-8")
        else:
            payload = json.dumps(play, ensure_ascii=False).encode("utf-8")
        # Serialize before opening so a failure leaves no empty file behind.
        with open('%s.mp4' % self.name, 'wb') as f:
            f.write(payload)
# if __name__ == '__main__':
# vip = web()
# vip.get_playlist()
'''
Fetch the names and links of all movies in bulk.
Movie listing API endpoints:
https://list.youku.com/category/page?c=96&pt=2&type=show&p=1
https://list.youku.com/category/page?c=96&pt=2&type=show&p=2
https://list.youku.com/category/page?c=96&pt=2&type=show&p=3
https://list.youku.com/category/page?c=96&pt=2&type=show&p=4
https://list.youku.com/category/page?c=96&pt=2&type=show&p=5
Details returned by each endpoint:
{'success': True,
'message': '',
'data': # 数据
[{'summaryType': 'UPDATE_STATUS',
'access': 'allow',
'type': 'vertical',
'img': '//r1.ykimg.com/051640005C8B7F56859B5D5D300E06C1',
'summary': '正片',
'title': '篮球冠军', # 电影名称
'subTitle': '傲慢教练与怪异球队',
'videoId': 'XNDE4MzY4NjUzNg==',
'videoLink': '//v.youku.com/v_show/id_XNDE4MzY4NjUzNg==.html'} # 电影详情链接
...
]
div containing the VIP movie link:
<div id="dramaFixedWrap" class="drama-fixed-wrap">
<div class="item item-cover item-cover-fixed active" item-id="item_XNDE4MzY4NjUzNg==" title="篮球冠军">
<a href="//v.youku.com/v_show/id_XNDE4MzY4NjUzNg==.html?&s=eccc9254a71842e09356">
# the link that needs to be parsed
<a href="(.*?)">
<div class="cover"><img src="https://vthumb.ykimg.com/054102015CDD1E950000017A690856DF"></div>
<div class="title">篮球冠军</div>
</a>
</div>
<i class="scroll-fixed"></i>
</div>
'''
import requests
# Fetch the JSON data of one movie listing page
def parse_index(url, timeout=10):
    """Fetch one movie-listing page and return its ``data`` field.

    Args:
        url: Listing endpoint to request.
        timeout: Seconds to wait for the server. Without an explicit timeout
            ``requests`` can block indefinitely on an unresponsive host.

    Returns:
        The value stored under ``'data'`` in the decoded JSON object, or
        ``None`` when that key is absent.
    """
    res = requests.get(url, timeout=timeout)
    return res.json().get('data')
# Keep only the movie title and movie link, yielded from a generator
def get_vip_movie(datas):
    """Yield ``(title, video_link)`` for each movie entry in ``datas``.

    Args:
        datas: Iterable of dicts carrying ``'title'`` and a
            protocol-relative ``'videoLink'`` (e.g. ``'//v.youku.com/...'``).
            ``None`` is treated as an empty listing.

    Yields:
        Tuples of the entry's title and its link prefixed with ``https:``.
        Entries without a ``videoLink`` are skipped.
    """
    # ``datas`` is None when the listing response had no 'data' key;
    # iterating it directly raised TypeError.
    for entry in datas or ():
        link = entry.get('videoLink')
        if not link:
            # Nothing to resolve without a link; concatenating None with
            # 'https:' used to raise TypeError here.
            continue
        yield entry.get('title'), 'https:' + link
# url = 'https://list.youku.com/category/show/c_96_pt_2.html?spm=a2ha1.12701310.app.5~5!2~5~5~5~DL!6~DD~A!3'
if __name__ == '__main__':
    # Walk listing pages 1..10 and resolve every movie found on each page.
    base_url = 'https://list.youku.com/category/page?c=96&pt=2&type=show&p={}'
    vip = web()
    for page in range(1, 11):
        # JSON 'data' payload of this listing page.
        listing = parse_index(base_url.format(page))
        # The generator yields (movie name, movie url) pairs.
        for name, link in get_vip_movie(listing):
            vip.name = name
            vip.url = link
            vip.get_playlist()
            print(name, link)