1028 dokiss
9 months ago
1 changed files with 255 additions and 0 deletions
@ -0,0 +1,255 @@ |
|||
#coding=utf-8 |
|||
#!/usr/bin/python |
|||
import sys |
|||
sys.path.append('..') |
|||
from base.spider import Spider |
|||
import json |
|||
import base64 |
|||
import re |
|||
import math |
|||
import time |
|||
import uuid |
|||
import hashlib |
|||
from urllib import request, parse |
|||
import urllib |
|||
import urllib.request |
|||
|
|||
class Spider(Spider): # 元类 默认的元类 type |
|||
def getName(self): |
|||
return "1905电影" |
|||
def init(self,extend=""): |
|||
print("============{0}============".format(extend)) |
|||
pass |
|||
def isVideoFormat(self,url): |
|||
pass |
|||
def manualVideoCheck(self): |
|||
pass |
|||
def homeContent(self,filter): |
|||
result = {} |
|||
cateManual = { |
|||
"电影": "n_1", |
|||
"微电影":"n_1_c_922", |
|||
"系列电影":"n_2", |
|||
"纪录片":"c_927", |
|||
"晚会":"n_1_c_586", |
|||
"独家":"n_1_c_178", |
|||
"综艺":"n_1_c_1024" |
|||
# ,"体育":"n_1_c_1053" |
|||
} |
|||
classes = [] |
|||
for k in cateManual: |
|||
classes.append({ |
|||
'type_name':k, |
|||
'type_id':cateManual[k] |
|||
}) |
|||
result['class'] = classes |
|||
if(filter): |
|||
result['filters'] = self.config['filter'] |
|||
return result |
|||
def homeVideoContent(self): |
|||
url = 'https://www.1905.com/vod/cctv6/lst/' |
|||
rsp = self.fetch(url, headers=self.header) |
|||
html = self.html(rsp.text) |
|||
aList = html.xpath("//div[@class='grid-2x']/a") |
|||
videos = self.custom_list(aList=aList) |
|||
result = { |
|||
'list':videos |
|||
} |
|||
return result |
|||
def categoryContent(self,tid,pg,filter,extend): |
|||
result = {} |
|||
videos=[] |
|||
by='/o1p' |
|||
if 'by' in extend.keys(): |
|||
by='/{0}p'.format(extend['by']) |
|||
url = 'https://www.1905.com/vod/list/{0}{2}{1}.html'.format(tid, pg,by) |
|||
rsp = self.fetch(url, headers=self.header) |
|||
HtmlTxt=rsp.text |
|||
html = self.html(HtmlTxt) |
|||
aList = html.xpath("//section[contains(@class,'search-list')]/div/a" if tid != u'n_2' else "//div[@class='mod']/div[1]/a") |
|||
videos = self.custom_list(aList=aList) |
|||
limit = len(aList) |
|||
result['list'] = videos |
|||
result['page'] = pg |
|||
result['pagecount'] = 100 |
|||
result['limit'] = limit |
|||
result['total'] = 100 * limit |
|||
return result |
|||
def detailContent(self,array): |
|||
result = {} |
|||
aid = array[0] |
|||
vodItems=[] |
|||
playList=[] |
|||
vod_play_from=['1905电影',] |
|||
if aid.isdigit()==False: |
|||
rsp = self.fetch(aid, headers=self.header) |
|||
HtmlTxt=rsp.text |
|||
url=self.regStr(reg=r'<a class="iconBanner-playBtn icon-banner btn-play"\s*href="(.+?)"',src=HtmlTxt) |
|||
if url=='': |
|||
url=self.regStr(reg=r'property="og:url"\scontent="(.+?)"',src=HtmlTxt) |
|||
if len(self.regStr(reg=r'(vip.1905)',src=url))>3: |
|||
vod_play_from=['1905电影(需要vip解析)',] |
|||
aid=url |
|||
else: |
|||
aid=self.regStr(reg=r'play/(.*?)\.sh',src=url) |
|||
if aid=='': |
|||
return {'list': []} |
|||
elif aid.isdigit() and vod_play_from[0].find('需要vip解析')<0: |
|||
url = "https://www.1905.com/api/content/?callback=&m=Vod&a=getVodSidebar&id={0}&fomat=json".format(aid) |
|||
rsp = self.fetch(url, headers=self.header) |
|||
HtmlTxt=rsp.text |
|||
root = json.loads(HtmlTxt) |
|||
title = root['title'] |
|||
pic = root['thumb'] |
|||
remark = root['commendreason'] |
|||
content = root['description'] |
|||
actor = root['starring'] |
|||
direct = root['direct'] |
|||
vodItems.append(title + "$" + aid) |
|||
series = root['info']['series_data'] |
|||
series = root['info']['series_data'] |
|||
for ser in series: |
|||
vodItems.append(ser['title'] + "$" + ser['contentid']) |
|||
joinStr = '#'.join(vodItems) |
|||
playList.append(joinStr) |
|||
else: |
|||
rsp = self.fetch(array[0], headers=self.header) |
|||
HtmlTxt=rsp.text |
|||
title=self.regStr(reg=r'<div class="container-right">\s*\r*\n*\t*<h1>(.+?)<',src=HtmlTxt).replace(' ','') |
|||
pic=self.regStr(reg=r'<img class="poster" src="(.+?)"',src=HtmlTxt) |
|||
remark='' |
|||
actor='' |
|||
direct='' |
|||
content=self.regStr(reg=r'<p>(.+?)</p>',src=HtmlTxt) |
|||
vodItems.append(title + "$" + aid) |
|||
joinStr = '#'.join(vodItems) |
|||
playList.append(joinStr) |
|||
|
|||
vod = { |
|||
"vod_id":array[0], |
|||
"vod_name":title, |
|||
"vod_pic":pic, |
|||
"type_name":'', |
|||
"vod_year":"", |
|||
"vod_area":"", |
|||
"vod_remarks":remark, |
|||
"vod_actor":actor, |
|||
"vod_director":direct, |
|||
"vod_content":content |
|||
} |
|||
vod['vod_play_from'] = "$$$".join(vod_play_from) |
|||
vod['vod_play_url'] = "$$$".join(playList) |
|||
result = { |
|||
'list':[ |
|||
vod |
|||
] |
|||
} |
|||
return result |
|||
|
|||
def searchContent(self,key,quick): |
|||
url = 'https://www.1905.com/search/index-p-type-film-q-{}.html?envod=1&year=0&score=0&order=0'.format(key)#只搜索能看电影,想搜其它的可以把html之后的字符删掉 |
|||
#https://www.1905.com/search/index-p-type-all-q-{}.html |
|||
rsp = self.fetch(url, headers=self.header) |
|||
html = self.html(rsp.text) |
|||
aList = html.xpath("//div/div[contains(@class,'new_content')]/div/div/div/a") |
|||
videos = self.custom_list(aList=aList) |
|||
result = { |
|||
'list':videos |
|||
} |
|||
return result |
|||
def playerContent(self,flag,id,vipFlags): |
|||
result = {} |
|||
if flag.find('vip解析')>0: |
|||
result["parse"] = 1#0=直接播放、1=嗅探 |
|||
result["playUrl"] ='' |
|||
result["url"] = id |
|||
result['jx'] = 1#1=VIP解析,0=不解析 |
|||
result["header"] = '' |
|||
else: |
|||
nonce = int(round(time.time() * 1000)) |
|||
expiretime = nonce + 600 |
|||
uid = str(uuid.uuid4()) |
|||
playerid = uid.replace("-", "")[5:20] |
|||
signature = 'cid={0}&expiretime={1}&nonce={2}&page=https%3A%2F%2Fwww.1905.com%2Fvod%2Fplay%2F{3}.shtml&playerid={4}&type=hls&uuid={5}.dde3d61a0411511d'.format(id,expiretime,nonce,id,playerid,uid) |
|||
signature = hashlib.sha1(signature.encode()).hexdigest() |
|||
url = 'https://profile.m1905.com/mvod/getVideoinfo.php?nonce={0}&expiretime={1}&cid={2}&uuid={3}&playerid={4}&page=https%3A%2F%2Fwww.1905.com%2Fvod%2Fplay%2F{5}.shtml&type=hls&signature={6}&callback='.format(nonce,expiretime,id,uid,playerid,id,signature) |
|||
rsp = self.fetch(url, headers=self.header) |
|||
HtmlTxt=rsp.text |
|||
jo = json.loads(HtmlTxt.replace("(", "").replace(")", "")) |
|||
data = jo['data']['sign'] |
|||
sign = '' |
|||
qualityStr = '' |
|||
if 'uhd' in data.keys(): |
|||
sign = data['uhd']['sign'] |
|||
qualityStr = 'uhd' |
|||
elif 'hd' in data.keys(): |
|||
sign = data['hd']['sign'] |
|||
qualityStr = 'hd' |
|||
elif 'sd' in data.keys(): |
|||
sign = data['sd']['sign'] |
|||
qualityStr = 'sd' |
|||
host = jo['data']['quality'][qualityStr]['host'] |
|||
path = jo['data']['path'][qualityStr]['path'] |
|||
playUrl = host + sign + path |
|||
result["parse"] = 1#0=直接播放、1=嗅探 |
|||
result["playUrl"] ='' |
|||
result["url"] = playUrl |
|||
result["header"] = self.header |
|||
return result |
|||
|
|||
|
|||
config = { |
|||
"player": {}, |
|||
"filter": { |
|||
"n_1":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
], |
|||
"n_1_c_922":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
], |
|||
"n_2":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
], |
|||
"c_927":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
], |
|||
"n_1_c_586":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
], |
|||
"n_1_c_178":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
], |
|||
"n_1_c_1024":[ |
|||
{"key":"by","name":"排序:","value":[{"n":"默认(最新)","v":"o1"},{"n":"最热","v":"o3"},{"n":"好评","v":"o4"}]} |
|||
] |
|||
} |
|||
} |
|||
header = { |
|||
'User-Agent': 'Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/117.0.0.0 Safari/537.36 Edg/117.0.2045.43', |
|||
'Referer': 'https://www.1905.com/vod/list/n_1/o3p1.html', |
|||
'Accept': 'text/html,application/xhtml+xml,application/xml;q=0.9,image/webp,image/apng,*/*;q=0.8,application/signed-exchange;v=b3;q=0.7' |
|||
} |
|||
def localProxy(self,param): |
|||
return [200, "video/MP2T", action, ""] |
|||
#-----------------------------------------------自定义函数----------------------------------------------- |
|||
#分类取结果 |
|||
def custom_list(self,aList): |
|||
videos = [] |
|||
for a in aList: |
|||
img=a.xpath('./img/@src')[0] |
|||
title=a.xpath('./img/@alt')[0] |
|||
url=a.xpath("./@href")[0] |
|||
if url.find('vip.1905')>1:#可以除掉 |
|||
continue |
|||
if self.regStr(reg=r'(play)',src=url)=='': |
|||
vod_id="{0}".format(url) |
|||
else: |
|||
id=self.regStr(reg=r'play/(.*?)\.sh',src=url) |
|||
vod_id="{0}".format(id) |
|||
videos.append({ |
|||
"vod_id":vod_id, |
|||
"vod_name":title, |
|||
"vod_pic":img, |
|||
"vod_remarks":'' |
|||
}) |
|||
return videos |
Loading…
Reference in new issue