2024-09-03 18:15:22 +08:00

217 lines
8.2 KiB
Python

# coding=utf-8
# !/usr/bin/python
import sys
import re
sys.path.append('..')
from base.spider import Spider
import urllib.parse
class Spider(Spider): # 元类 默认的元类 type
def getName(self):
return "创艺影视"
def init(self, extend=""):
print("============{0}============".format(extend))
pass
def homeContent(self, filter):
result = {}
cateManual = {
"电影": "1",
"剧集": "2",
"动漫": "4",
"综艺": "3",
"纪录片": "30"
}
classes = []
for k in cateManual:
classes.append({
'type_name': k,
'type_id': cateManual[k]
})
result['class'] = classes
if (filter):
result['filters'] = self.config['filter']
return result
def homeVideoContent(self):
result = {
'list': []
}
return result
def categoryContent(self, tid, pg, filter, extend):
result = {}
header = {"User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
url = 'https://www.30dian.cn/vodtype/{0}-{1}.html'.format(tid, pg)
rsp = self.fetch(url,headers=header)
root = self.html(self.cleanText(rsp.text))
aList = root.xpath("//div[@class='myui-panel myui-panel-bg clearfix']/div/div/ul/li")
videos = []
for a in aList:
name = a.xpath('./div/a/@title')[0]
pic = a.xpath('./div/a/@data-original')[0]
mark = a.xpath("./div/a/span/span[@class='tag']/text()")[0]
sid = a.xpath("./div/a/@href")[0].replace("/", "").replace("voddetail", "").replace(".html", "")
videos.append({
"vod_id": sid,
"vod_name": name,
"vod_pic": pic,
"vod_remarks": mark
})
result['list'] = videos
result['page'] = pg
result['pagecount'] = 999
result['limit'] = 5
result['total'] = 9999
return result
def detailContent(self, array):
tid = array[0]
url = 'https://www.30dian.cn/voddetail/{0}.html'.format(tid)
header = {"User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
rsp = self.fetch(url,headers=header)
root = self.html(self.cleanText(rsp.text))
divContent = root.xpath("//div[@class='col-lg-wide-75 col-md-wide-7 col-xs-1 padding-0']")[0]
title = divContent.xpath(".//div[@class='myui-content__detail']/h1/text()")[0]
pic = divContent.xpath(".//div[@class='myui-content__thumb']/a/img/@data-original")[0]
det = divContent.xpath(".//div[@class='col-pd text-collapse content']/span[@class='data']")[0]
if det.text is None:
detail = det.xpath(".//p/text()")[0]
else:
detail = det.text
vod = {
"vod_id": tid,
"vod_name": title,
"vod_pic": pic,
"type_name": "",
"vod_year": "",
"vod_area": "",
"vod_remarks": "",
"vod_actor": "",
"vod_director": "",
"vod_content": detail
}
infoArray = divContent.xpath(".//div[@class='myui-content__detail']/p[contains(@class,'data')]")
for info in infoArray:
content = info.xpath('string(.)')
flag = "分类" in content
if flag == True:
infon = content.replace("\t","").replace("\n","").strip().split('\r')
for inf in infon:
if inf.startswith('分类'):
vod['type_name'] = inf.replace("分类:", "")
if inf.startswith('地区'):
vod['vod_area'] = inf.replace("地区:", "")
if inf.startswith('年份'):
vod['vod_year'] = inf.replace("年份:", "")
if content.startswith('主演'):
vod['vod_actor'] = content.replace("\xa0", "/").replace("主演:", "").strip('/')
if content.startswith('更新'):
vod['vod_remarks'] = content.replace("更新:", "")
if content.startswith('导演'):
vod['vod_director'] = content.replace("\xa0", "").replace("导演:", "").strip('/')
vod_play_from = '$$$'
playFrom = []
vodHeader = divContent.xpath(".//div[@class='myui-panel_hd']/div/ul/li/a[contains(@href,'playlist')]/text()")
for v in vodHeader:
playFrom.append(v.replace(" ", ""))
vod_play_from = vod_play_from.join(playFrom)
vod_play_url = '$$$'
playList = []
vodList = divContent.xpath(".//div[contains(@id,'playlist')]")
for vl in vodList:
vodItems = []
aList = vl.xpath('./ul/li/a')
if len(aList) <= 0:
name = '无法找到播放源'
tId = '00000'
vodItems.append(name + "$" + tId)
else:
for tA in aList:
href = tA.xpath('./@href')[0]
name = tA.xpath("./text()")[0].replace(" ", "")
tId = self.regStr(href, '/vodplay/(\\S+).html')
vodItems.append(name + "$" + tId)
joinStr = '#'
joinStr = joinStr.join(vodItems)
playList.append(joinStr)
vod_play_url = vod_play_url.join(playList)
vod['vod_play_from'] = vod_play_from
vod['vod_play_url'] = vod_play_url
result = {
'list': [
vod
]
}
return result
def searchContent(self, key, quick):
url = 'https://www.30dian.cn/vodsearch/-------------.html?wd={0}'.format(key)
header = {
"User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
rsp = self.fetch(url, headers=header)
root = self.html(self.cleanText(rsp.text))
aList = root.xpath("//ul[contains(@class,'myui-vodlist__media clearfix')]/li")
videos = []
for a in aList:
name = a.xpath(".//div[@class='detail']/h4/a/text()")[0]
pic = a.xpath(".//a[contains(@class,'myui-vodlist__thumb')]//@data-original")[0]
mark = a.xpath(".//span[@class='tag']/text()")[0]
sid = a.xpath(".//div[@class='detail']/h4/a/@href")[0]
sid = self.regStr(sid,'/voddetail/(\\S+).html')
videos.append({
"vod_id": sid,
"vod_name": name,
"vod_pic": pic,
"vod_remarks": mark
})
result = {
'list': videos
}
return result
def playerContent(self, flag, id, vipFlags):
result = {}
header = {
"User-Agent": "Mozilla/5.0 (Linux; Android 4.4.2; Nexus 4 Build/KOT49H) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/34.0.1847.114 Mobile Safari/537.36"}
if id == '00000':
return {}
url = 'https://www.30dian.cn/vodplay/{0}.html'.format(id)
rsp = self.fetch(url,headers=header)
root = self.html(self.cleanText(rsp.text))
scripts = root.xpath("//div[@class='embed-responsive clearfix']/script[@type='text/javascript']/text()")[0]
ukey = re.findall(r"url(.*)url_next", scripts)[0].replace('"', "").replace(',', "").replace(':', "")
purl = urllib.parse.unquote(ukey)
result["parse"] = 0
result["playUrl"] = ''
result["url"] =purl
result["header"] = {"User-Agent": "Mozilla/5.0 (Windows NT 10.0; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/86.0.4240.198 Safari/537.36"}
return result
config = {
"player": {},
"filter": {}
}
header = {}
def isVideoFormat(self, url):
pass
def manualVideoCheck(self):
pass
def localProxy(self, param):
action = {
'url': '',
'header': '',
'param': '',
'type': 'string',
'after': ''
}
return [200, "video/MP2T", action, ""]