2
0

py_Czjy.py 5.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204
  1. #coding=utf-8
  2. #!/usr/bin/python
  3. import sys
  4. sys.path.append('..')
  5. from base.spider import Spider
  6. import json
  7. import time
  8. import base64
  9. import requests
  10. class Spider(Spider): # 元类 默认的元类 type
  11. def getName(self):
  12. return "初中教育"
  13. def init(self,extend=""):
  14. print("============{0}============".format(extend))
  15. pass
  16. def isVideoFormat(self,url):
  17. pass
  18. def manualVideoCheck(self):
  19. pass
  20. def homeContent(self,filter):
  21. result = {}
  22. cateManual = {
  23. "7年级语文": "7年级语文",
  24. "7年级数学": "7年级数学",
  25. "7年级英语": "7年级英语",
  26. "7年级历史": "7年级历史",
  27. "7年级地理": "7年级地理",
  28. "7年级生物": "7年级生物",
  29. "7年级物理": "7年级物理",
  30. "7年级化学": "7年级化学",
  31. "8年级语文": "8年级语文",
  32. "8年级数学": "8年级数学",
  33. "8年级英语": "8年级英语",
  34. "8年级历史": "8年级历史",
  35. "8年级地理": "8年级地理",
  36. "8年级生物": "8年级生物",
  37. "8年级物理": "8年级物理",
  38. "8年级化学": "8年级化学",
  39. "9年级语文": "9年级语文",
  40. "9年级数学": "9年级数学",
  41. "9年级英语": "9年级英语",
  42. "9年级历史": "9年级历史",
  43. "9年级地理": "9年级地理",
  44. "9年级生物": "9年级生物",
  45. "9年级物理": "9年级物理",
  46. "9年级化学": "9年级化学"
  47. }
  48. classes = []
  49. for k in cateManual:
  50. classes.append({
  51. 'type_name':k,
  52. 'type_id':cateManual[k]
  53. })
  54. result['class'] = classes
  55. if(filter):
  56. result['filters'] = self.config['filter']
  57. return result
  58. def homeVideoContent(self):
  59. result = {
  60. 'list':[]
  61. }
  62. return result
  63. cookies = ''
  64. def getCookie(self):
  65. cookies_str = self.fetch("https://agit.ai/138001380000/MHQTV/raw/branch/master/bbcookie.txt").text
  66. cookies_dic = dict([co.strip().split('=') for co in cookies_str.split(';')])
  67. rsp = requests.session()
  68. cookies_jar = requests.utils.cookiejar_from_dict(cookies_dic)
  69. rsp.cookies = cookies_jar
  70. content = self.fetch("http://api.bilibili.com/x/web-interface/nav", cookies=rsp.cookies)
  71. res = json.loads(content.text)
  72. if res["code"] == 0:
  73. self.cookies = rsp.cookies
  74. else:
  75. rsp = self.fetch("https://www.bilibili.com/")
  76. self.cookies = rsp.cookies
  77. return rsp.cookies
  78. def categoryContent(self,tid,pg,filter,extend):
  79. result = {}
  80. url = 'https://api.bilibili.com/x/web-interface/search/type?search_type=video&keyword={0}&duration=4&page={1}'.format(tid,pg)
  81. if len(self.cookies) <= 0:
  82. self.getCookie()
  83. rsp = self.fetch(url,cookies=self.cookies)
  84. content = rsp.text
  85. jo = json.loads(content)
  86. if jo['code'] != 0:
  87. rspRetry = self.fetch(url,cookies=self.getCookie())
  88. content = rspRetry.text
  89. jo = json.loads(content)
  90. videos = []
  91. vodList = jo['data']['result']
  92. for vod in vodList:
  93. aid = str(vod['aid']).strip()
  94. title = vod['title'].strip().replace("<em class=\"keyword\">","").replace("</em>","")
  95. img = 'https:' + vod['pic'].strip()
  96. remark = str(vod['duration']).strip()
  97. videos.append({
  98. "vod_id":aid,
  99. "vod_name":title,
  100. "vod_pic":img,
  101. "vod_remarks":remark
  102. })
  103. result['list'] = videos
  104. result['page'] = pg
  105. result['pagecount'] = 9999
  106. result['limit'] = 90
  107. result['total'] = 999999
  108. return result
  109. def cleanSpace(self,str):
  110. return str.replace('\n','').replace('\t','').replace('\r','').replace(' ','')
  111. def detailContent(self,array):
  112. aid = array[0]
  113. url = "https://api.bilibili.com/x/web-interface/view?aid={0}".format(aid)
  114. rsp = self.fetch(url,headers=self.header)
  115. jRoot = json.loads(rsp.text)
  116. jo = jRoot['data']
  117. title = jo['title'].replace("<em class=\"keyword\">","").replace("</em>","")
  118. pic = jo['pic']
  119. desc = jo['desc']
  120. typeName = jo['tname']
  121. vod = {
  122. "vod_id":aid,
  123. "vod_name":title,
  124. "vod_pic":pic,
  125. "type_name":typeName,
  126. "vod_year":"",
  127. "vod_area":"",
  128. "vod_remarks":"",
  129. "vod_actor":"",
  130. "vod_director":"",
  131. "vod_content":desc
  132. }
  133. ja = jo['pages']
  134. playUrl = ''
  135. for tmpJo in ja:
  136. cid = tmpJo['cid']
  137. part = tmpJo['part']
  138. playUrl = playUrl + '{0}${1}_{2}#'.format(part,aid,cid)
  139. vod['vod_play_from'] = 'B站'
  140. vod['vod_play_url'] = playUrl
  141. result = {
  142. 'list':[
  143. vod
  144. ]
  145. }
  146. return result
  147. def searchContent(self,key,quick):
  148. result = {
  149. 'list':[]
  150. }
  151. return result
  152. def playerContent(self,flag,id,vipFlags):
  153. # https://www.555dianying.cc/vodplay/static/js/playerconfig.js
  154. result = {}
  155. ids = id.split("_")
  156. url = 'https://api.bilibili.com:443/x/player/playurl?avid={0}&cid=%20%20{1}&qn=112'.format(ids[0],ids[1])
  157. rsp = self.fetch(url, cookies=self.cookies)
  158. jRoot = json.loads(rsp.text)
  159. jo = jRoot['data']
  160. ja = jo['durl']
  161. maxSize = -1
  162. position = -1
  163. for i in range(len(ja)):
  164. tmpJo = ja[i]
  165. if maxSize < int(tmpJo['size']):
  166. maxSize = int(tmpJo['size'])
  167. position = i
  168. url = ''
  169. if len(ja) > 0:
  170. if position == -1:
  171. position = 0
  172. url = ja[position]['url']
  173. result["parse"] = 0
  174. result["playUrl"] = ''
  175. result["url"] = url
  176. result["header"] = {
  177. "Referer":"https://www.bilibili.com",
  178. "User-Agent":"Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36"
  179. }
  180. result["contentType"] = 'video/x-flv'
  181. return result
  182. config = {
  183. "player": {},
  184. "filter": {}
  185. }
  186. header = {}
  187. def localProxy(self,param):
  188. return [200, "video/MP2T", action, ""]