-
Notifications
You must be signed in to change notification settings - Fork 284
Expand file tree
/
Copy pathAppFox.py
More file actions
187 lines (171 loc) · 7.95 KB
/
AppFox.py
File metadata and controls
187 lines (171 loc) · 7.95 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
"""
@header({
searchable: 1,
filterable: 1,
quickSearch: 1,
title: 'AppFox',
lang: 'hipy'
})
"""
# -*- coding: utf-8 -*-
# 本资源来源于互联网公开渠道,仅可用于个人学习爬虫技术。
# 严禁将其用于任何商业用途,下载后请于 24 小时内删除,搜索结果均来自源站,本人不承担任何责任。
try:
from base.spider import BaseSpider
except ImportError:
from t4.base.spider import BaseSpider
import re, sys, json, urllib3
urllib3.disable_warnings(urllib3.exceptions.InsecureRequestWarning)
sys.path.append('..')
class Spider(BaseSpider):
headers, host, froms, detail, custom_first, parses, custom_parses = {
'User-Agent': "Mozilla/5.0 (Linux; Android 12; SM-S9080 Build/V417IR; wv) AppleWebKit/537.36 (KHTML, like Gecko) Version/4.0 Chrome/101.0.4951.61 Safari/537.36",
'Connection': "Keep-Alive",
'Accept-Encoding': "gzip",
'Accept-Language': "zh-CN,zh;q=0.8",
'Cache-Control': "no-cache"
}, '', '', '', '', {}, {}
def init(self, extend=''):
print("============{0}============".format(extend))
ext = self.extend.strip()
if ext.startswith('http'):
host = ext
else:
arr = json.loads(ext)
host = arr['host']
self.froms = arr.get('from', '')
self.custom_parses = arr.get('parse', {})
self.custom_first = arr.get('custom_first', 0)
if not re.match(r'^https?:\/\/[a-zA-Z0-9-]+(\.[a-zA-Z0-9-]+)*(:\d+)?(\/)?$', host):
host = self.fetch(host, headers=self.headers, verify=False).json()['apiDomain']
self.host = host.rstrip('/')
def homeContent(self, filter):
if not self.host: return None
response = self.fetch(f'{self.host}/api.php/Appfox/init', headers=self.headers, verify=False).json()
classes = []
for i in response['data']['type_list']:
classes.append({'type_id': i['type_id'], 'type_name': i['type_name']})
return {'class': classes}
def homeVideoContent(self):
if not self.host: return None
response = self.fetch(f'{self.host}/api.php/Appfox/index', headers=self.headers, verify=False).json()
data = response['data']
videos = []
for i in data:
for j in i.get('banner', []):
videos.append(j)
for k in i.get('categories', []):
for l in k.get('videos', []):
videos.append(l)
return {'list': videos}
def categoryContent(self, tid, pg, filter, extend):
if not self.host: return None
response = self.fetch(
f"{self.host}/api.php/Appfox/vodList?type_id={tid}&class=全部&area=全部&lang=全部&year=全部&sort=最新&page={pg}",
headers=self.headers, verify=False).json()
videos = []
for i in response['data']['recommend_list']:
videos.append(i)
return {'list': videos}
def searchContent(self, key, quick, pg='1'):
if not self.host: return None
path = f"{self.host}/api.php/Appfox/vod?ac=detail&wd={key}"
if self.froms: path += '&from=' + self.froms
response = self.fetch(path, headers=self.headers, verify=False).json()
self.detail = response['list']
return response
def detailContent(self, ids):
video = next((i for i in self.detail if str(i['vod_id']) == str(ids[0])), None)
if not video:
detail_response = self.fetch(f"{self.host}/api.php/Appfox/vod?ac=detail&ids={ids[0]}", headers=self.headers,
verify=False).json()
video = detail_response.get('list')[0]
if not video: return {'list': []}
play_from = video['vod_play_from'].split('$$$')
play_urls = video['vod_play_url'].split('$$$')
try:
config_response = self.fetch(f"{self.host}/api.php/Appfox/config", headers=self.headers,
verify=False).json()
player_list = config_response.get('data', {}).get('playerList', [])
jiexi_data_list = config_response.get('data', {}).get('jiexiDataList', [])
except Exception:
return {'list': [video]}
player_map = {player['playerCode']: player for player in player_list}
processed_play_urls = []
for idx, play_code in enumerate(play_from):
if play_code in player_map:
player_info = player_map[play_code]
if player_info['playerCode'] != player_info['playerName']:
play_from[idx] = f"{player_info['playerName']}\u2005({play_code})"
if idx < len(play_urls):
urls = play_urls[idx].split('#')
processed_urls = []
for url in urls:
parts = url.split('$')
if len(parts) >= 2:
parts[1] = f"{play_code}@{parts[1]}"
processed_urls.append('$'.join(parts))
else:
processed_urls.append(url)
processed_play_urls.append('#'.join(processed_urls))
video['vod_play_from'] = '$$$'.join(play_from)
video['vod_play_url'] = '$$$'.join(processed_play_urls)
self.parses.update({p['playerCode']: p['url'] for p in jiexi_data_list if p.get('url', '').startswith('http')})
return {'list': [video]}
def playerContent(self, flag, id, vipflags):
play_from, raw_url = id.split('@', 1)
jx, parse, parsed = 1, 0, 0
url = raw_url
parses_main = []
if self.custom_first == 1:
parses_main.append(self.custom_parses)
parses_main.append(self.parses)
else:
parses_main.append(self.parses)
parses_main.append(self.custom_parses)
for parses2 in parses_main:
if not parsed and not re.match(r'https?://.*\.(m3u8|mp4|flv)', url):
for key, parsers in parses2.items():
if play_from not in key:
continue
if isinstance(parsers, list):
for parser in parsers:
if parser.startswith('parse:'):
url, jx, parse = parser.split('parse:')[1] + raw_url, 0, 1
break
try:
response = self.fetch(f"{parser}{raw_url}", headers=self.headers, verify=False).json()
if response.get('url', '').startswith('http'):
url, parsed = response['url'], 1
break
except Exception:
continue
else:
if parsers.startswith('parse:'):
url, jx, parse = parsers.split('parse:')[1] + raw_url, 0, 1
break
try:
response = self.fetch(f"{parsers}{raw_url}", headers=self.headers, verify=False).json()
if response.get('url', '').startswith('http'):
url, parsed = response['url'], 1
break
except Exception:
continue
if parsed or parse:
break
if parsed or parse:
break
if re.match(r'https?:\/\/.*\.(m3u8|mp4|flv)', url) or parsed == 1:
jx = 0
return {'jx': jx, 'parse': parse, 'url': url, 'header': {
'User-Agent': 'Mozilla/5.0 (iPhone; CPU iPhone OS 13_2_3 like Mac OS X) AppleWebKit/605.1.15 (KHTML, like Gecko) Version/13.0.3 Mobile/15E148 Safari/604.1'}}
def getName(self):
return 'AppFox'
def isVideoFormat(self, url):
pass
def manualVideoCheck(self):
pass
def destroy(self):
pass
def localProxy(self, param):
pass