2
0

py_Gzjy.py 6.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241
  1. #coding=utf-8
  2. #!/usr/bin/python
  3. import sys
  4. sys.path.append('..')
  5. from base.spider import Spider
  6. import json
  7. import time
  8. import base64
  9. import requests
  10. class Spider(Spider): # 元类 默认的元类 type
  11. def getName(self):
  12. return "高中教育"
  13. def init(self,extend=""):
  14. print("============{0}============".format(extend))
  15. pass
  16. def isVideoFormat(self,url):
  17. pass
  18. def manualVideoCheck(self):
  19. pass
  20. def homeContent(self,filter):
  21. result = {}
  22. cateManual = {
  23. "高一语文": "高一语文",
  24. "高一数学": "高一数学",
  25. "高一英语": "高一英语",
  26. "高一历史": "高一历史",
  27. "高一地理": "高一地理",
  28. "高一生物": "高一生物",
  29. "高一思想政治": "高一思想政治",
  30. "高一物理": "高一物理",
  31. "高一化学": "高一化学",
  32. "高二语文": "高二语文",
  33. "高二数学": "高二数学",
  34. "高二英语": "高二英语",
  35. "高二历史": "高二历史",
  36. "高二地理": "高二地理",
  37. "高二生物": "高二生物",
  38. "高二思想政治": "高二思想政治",
  39. "高二物理": "高二物理",
  40. "高二化学": "高二化学",
  41. "高三语文": "高三语文",
  42. "高三数学": "高三数学",
  43. "高三英语": "高三英语",
  44. "高三历史": "高三历史",
  45. "高三地理": "高三地理",
  46. "高三生物": "高三生物",
  47. "高三思想政治": "高三思想政治",
  48. "高三物理": "高三物理",
  49. "高三化学": "高三化学",
  50. "高一语文": "高一语文",
  51. "高一数学": "高一数学",
  52. "高一英语": "高一英语",
  53. "高一历史": "高一历史",
  54. "高一地理": "高一地理",
  55. "高一生物": "高一生物",
  56. "高一思想政治": "高一思想政治",
  57. "高一物理": "高一物理",
  58. "高一化学": "高一化学",
  59. "高二语文": "高二语文",
  60. "高二数学": "高二数学",
  61. "高二英语": "高二英语",
  62. "高二历史": "高二历史",
  63. "高二地理": "高二地理",
  64. "高二生物": "高二生物",
  65. "高二思想政治": "高二思想政治",
  66. "高二物理": "高二物理",
  67. "高二化学": "高二化学",
  68. "高三语文": "高三语文",
  69. "高三数学": "高三数学",
  70. "高三英语": "高三英语",
  71. "高三历史": "高三历史",
  72. "高三地理": "高三地理",
  73. "高三生物": "高三生物",
  74. "高三思想政治": "高三思想政治",
  75. "高三物理": "高三物理",
  76. "高三化学": "高三化学",
  77. "高中信息技术": "高中信息技术"
  78. }
  79. classes = []
  80. for k in cateManual:
  81. classes.append({
  82. 'type_name':k,
  83. 'type_id':cateManual[k]
  84. })
  85. result['class'] = classes
  86. if(filter):
  87. result['filters'] = self.config['filter']
  88. return result
  89. def homeVideoContent(self):
  90. result = {
  91. 'list':[]
  92. }
  93. return result
  94. cookies = ''
  95. def getCookie(self):
  96. cookies_str = self.fetch("https://agit.ai/138001380000/MHQTV/raw/branch/master/bbcookie.txt").text
  97. cookies_dic = dict([co.strip().split('=') for co in cookies_str.split(';')])
  98. rsp = requests.session()
  99. cookies_jar = requests.utils.cookiejar_from_dict(cookies_dic)
  100. rsp.cookies = cookies_jar
  101. content = self.fetch("http://api.bilibili.com/x/web-interface/nav", cookies=rsp.cookies)
  102. res = json.loads(content.text)
  103. if res["code"] == 0:
  104. self.cookies = rsp.cookies
  105. else:
  106. rsp = self.fetch("https://www.bilibili.com/")
  107. self.cookies = rsp.cookies
  108. return rsp.cookies
  109. def categoryContent(self,tid,pg,filter,extend):
  110. result = {}
  111. url = 'https://api.bilibili.com/x/web-interface/search/type?search_type=video&keyword={0}&duration=4&page={1}'.format(tid,pg)
  112. if len(self.cookies) <= 0:
  113. self.getCookie()
  114. rsp = self.fetch(url,cookies=self.cookies)
  115. content = rsp.text
  116. jo = json.loads(content)
  117. if jo['code'] != 0:
  118. rspRetry = self.fetch(url,cookies=self.getCookie())
  119. content = rspRetry.text
  120. jo = json.loads(content)
  121. videos = []
  122. vodList = jo['data']['result']
  123. for vod in vodList:
  124. aid = str(vod['aid']).strip()
  125. title = vod['title'].strip().replace("<em class=\"keyword\">","").replace("</em>","")
  126. img = 'https:' + vod['pic'].strip()
  127. remark = str(vod['duration']).strip()
  128. videos.append({
  129. "vod_id":aid,
  130. "vod_name":title,
  131. "vod_pic":img,
  132. "vod_remarks":remark
  133. })
  134. result['list'] = videos
  135. result['page'] = pg
  136. result['pagecount'] = 9999
  137. result['limit'] = 90
  138. result['total'] = 999999
  139. return result
  140. def cleanSpace(self,str):
  141. return str.replace('\n','').replace('\t','').replace('\r','').replace(' ','')
  142. def detailContent(self,array):
  143. aid = array[0]
  144. url = "https://api.bilibili.com/x/web-interface/view?aid={0}".format(aid)
  145. rsp = self.fetch(url,headers=self.header)
  146. jRoot = json.loads(rsp.text)
  147. jo = jRoot['data']
  148. title = jo['title'].replace("<em class=\"keyword\">","").replace("</em>","")
  149. pic = jo['pic']
  150. desc = jo['desc']
  151. typeName = jo['tname']
  152. vod = {
  153. "vod_id":aid,
  154. "vod_name":title,
  155. "vod_pic":pic,
  156. "type_name":typeName,
  157. "vod_year":"",
  158. "vod_area":"",
  159. "vod_remarks":"",
  160. "vod_actor":"",
  161. "vod_director":"",
  162. "vod_content":desc
  163. }
  164. ja = jo['pages']
  165. playUrl = ''
  166. for tmpJo in ja:
  167. cid = tmpJo['cid']
  168. part = tmpJo['part']
  169. playUrl = playUrl + '{0}${1}_{2}#'.format(part,aid,cid)
  170. vod['vod_play_from'] = 'B站'
  171. vod['vod_play_url'] = playUrl
  172. result = {
  173. 'list':[
  174. vod
  175. ]
  176. }
  177. return result
  178. def searchContent(self,key,quick):
  179. result = {
  180. 'list':[]
  181. }
  182. return result
  183. def playerContent(self,flag,id,vipFlags):
  184. # https://www.555dianying.cc/vodplay/static/js/playerconfig.js
  185. result = {}
  186. ids = id.split("_")
  187. url = 'https://api.bilibili.com:443/x/player/playurl?avid={0}&cid=%20%20{1}&qn=112'.format(ids[0],ids[1])
  188. rsp = self.fetch(url, cookies=self.cookies)
  189. jRoot = json.loads(rsp.text)
  190. jo = jRoot['data']
  191. ja = jo['durl']
  192. maxSize = -1
  193. position = -1
  194. for i in range(len(ja)):
  195. tmpJo = ja[i]
  196. if maxSize < int(tmpJo['size']):
  197. maxSize = int(tmpJo['size'])
  198. position = i
  199. url = ''
  200. if len(ja) > 0:
  201. if position == -1:
  202. position = 0
  203. url = ja[position]['url']
  204. result["parse"] = 0
  205. result["playUrl"] = ''
  206. result["url"] = url
  207. result["header"] = {
  208. "Referer":"https://www.bilibili.com",
  209. "User-Agent":"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36"
  210. }
  211. result["contentType"] = 'video/x-flv'
  212. return result
  213. config = {
  214. "player": {},
  215. "filter": {}
  216. }
  217. header = {}
  218. def localProxy(self,param):
  219. return [200, "video/MP2T", action, ""]