py_bilibili.py 7.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265
  1. #coding=utf-8
  2. #!/usr/bin/python
  3. import sys
  4. sys.path.append('..')
  5. from base.spider import Spider
  6. import json
  7. import time
  8. import base64
  9. class Spider(Spider): # 元类 默认的元类 type
  def getName(self):
      """Return the display name of this spider."""
      name = "TVBOX课堂"
      return name
  def init(self, extend=""):
      """Print ``extend`` wrapped in a banner of equals signs.

      No other initialisation is performed here.

      Args:
          extend: Value interpolated into the banner (defaults to "").
      """
      banner = "============{0}============".format(extend)
      print(banner)
  def isVideoFormat(self, url):
      """Placeholder hook: performs no check on ``url`` and returns None."""
      return None
  def manualVideoCheck(self):
      """Placeholder hook: does nothing and returns None."""
      return None
  def homeContent(self, filter):
      """Build the home-page category list.

      Every category uses its display name as its id as well; that id is
      what ``categoryContent`` later interpolates into the search URL as the
      keyword.

      Args:
          filter: When truthy, ``self.config['filter']`` is attached to the
              result under the ``'filters'`` key.

      Returns:
          dict with ``'class'`` (a list of ``{'type_name', 'type_id'}``
          dicts in declaration order) and, optionally, ``'filters'``.
      """
      # The original dict literal mapped every name to itself and listed
      # "高中信息技术" twice; a tuple of unique names yields the same output.
      categoryNames = (
          "TVBox",
          "MT管理器",
          "NP管理器",
          "WebDAV",
          "alist",
          "脱壳",
          "爬虫",
          "json&jar",
          "电影解说",
          "儿童早教",
          "儿童启蒙故事",
          "儿童英语启蒙",
          "儿童歌曲",
          "儿童绘画",
          "睡前故事",
          "儿童动画",
          "儿童音乐",
          "儿童安全教育",
          "宝宝巴士",
          "儿歌多多",
          "1年级语文",
          "1年级数学",
          "1年级英语",
          "2年级语文",
          "2年级数学",
          "2年级英语",
          "3年级语文",
          "3年级数学",
          "3年级英语",
          "4年级语文",
          "4年级数学",
          "4年级英语",
          "5年级语文",
          "5年级数学",
          "5年级英语",
          "6年级语文",
          "6年级数学",
          "6年级英语",
          "7年级语文",
          "7年级数学",
          "7年级英语",
          "7年级历史",
          "7年级地理",
          "7年级生物",
          "8年级语文",
          "8年级数学",
          "8年级英语",
          "8年级历史",
          "8年级地理",
          "8年级生物",
          "9年级语文",
          "9年级数学",
          "9年级英语",
          "9年级历史",
          "9年级地理",
          "9年级生物",
          "高一语文",
          "高一数学",
          "高一英语",
          "高一历史",
          "高一地理",
          "高一生物",
          "高一思想政治",
          "高一物理",
          "高一化学",
          "高二语文",
          "高二数学",
          "高二英语",
          "高二历史",
          "高二地理",
          "高二生物",
          "高二思想政治",
          "高二物理",
          "高二化学",
          "高三语文",
          "高三数学",
          "高三英语",
          "高三历史",
          "高三地理",
          "高三生物",
          "高三思想政治",
          "高三物理",
          "高三化学",
          "高中信息技术",
          "球星",
          "演讲",
          "搞笑",
          "广场舞",
          "动物世界",
          "MTV",
          "足球",
          "篮球",
          "小姐姐",
          "风景",
          "食谱",
          "鬼畜",
          "健身",
          "窗白噪音",
          "相声小品",
          "Zard",
          "演唱会",
      )
      result = {
          'class': [
              {'type_name': name, 'type_id': name} for name in categoryNames
          ],
      }
      if filter:
          result['filters'] = self.config['filter']
      return result
  def homeVideoContent(self):
      """Return the home-page video payload, which is always an empty list."""
      return {'list': []}
  # Cached cookies from the last getCookie() call; empty until the first call.
  cookies = ''

  def getCookie(self):
      """Fetch the Bilibili home page and cache the cookies it sets.

      Returns:
          The ``cookies`` attribute of the response, which is also stored
          on ``self.cookies``.
      """
      homePage = self.fetch("https://www.bilibili.com/")
      fresh = homePage.cookies
      self.cookies = fresh
      return fresh
  def categoryContent(self, tid, pg, filter, extend):
      """Search Bilibili videos for a category and return one result page.

      Args:
          tid: Category id; used as the search keyword.
          pg: Page number, forwarded to the API and echoed in the result.
          filter: Unused.
          extend: Unused.

      Returns:
          dict with ``'list'`` (one entry per hit carrying ``vod_id``,
          ``vod_name``, ``vod_pic`` and ``vod_remarks``) plus the paging
          fields ``page``, ``pagecount``, ``limit`` and ``total``. The last
          three are fixed placeholder values, not figures from the API.
      """
      # Function-scope import keeps this method self-contained.
      from urllib.parse import quote

      # Percent-encode the keyword: ids such as "json&jar" would otherwise
      # be split into two query parameters at the "&".
      keyword = quote(str(tid), safe='')
      url = 'https://api.bilibili.com/x/web-interface/search/type?search_type=video&keyword={0}&duration=4&page={1}'.format(keyword, pg)
      if len(self.cookies) <= 0:
          self.getCookie()
      jo = json.loads(self.fetch(url, cookies=self.cookies).text)
      if jo.get('code') != 0:
          # A non-zero code is retried once with freshly fetched cookies.
          jo = json.loads(self.fetch(url, cookies=self.getCookie()).text)

      # An answer without hits (or a failed retry) may lack 'data'/'result';
      # treat that as an empty page instead of raising KeyError.
      hits = (jo.get('data') or {}).get('result') or []
      videos = []
      for vod in hits:
          pic = vod['pic'].strip()
          # Only add a scheme when the URL does not already have one.
          if not pic.startswith(('http://', 'https://')):
              pic = 'https:' + pic
          # Strip the highlight markup the search API wraps around matches.
          title = vod['title'].strip().replace("<em class=\"keyword\">", "").replace("</em>", "")
          videos.append({
              "vod_id": str(vod['aid']).strip(),
              "vod_name": title,
              "vod_pic": pic,
              "vod_remarks": str(vod['duration']).strip(),
          })

      return {
          'list': videos,
          'page': pg,
          'pagecount': 9999,
          'limit': 90,
          'total': 999999,
      }
  def cleanSpace(self, str):
      """Return ``str`` with all newlines, tabs, carriage returns and spaces removed."""
      # NOTE: the parameter name shadows the builtin; it is kept unchanged
      # so existing callers are not affected.
      unwanted = ('\n', '\t', '\r', ' ')
      return ''.join(ch for ch in str if ch not in unwanted)
  def detailContent(self, array):
      """Fetch the detail record for one video and describe its parts.

      Args:
          array: Sequence whose first element is the video's ``aid``.

      Returns:
          dict with a one-element ``'list'`` holding the vod record. Its
          ``vod_play_url`` is a run of ``"<part>$<aid>_<cid>#"`` entries,
          one per page of the video.
      """
      aid = array[0]
      url = "https://api.bilibili.com/x/web-interface/view?aid={0}".format(aid)
      rsp = self.fetch(url, headers=self.header)
      jo = json.loads(rsp.text)['data']

      entries = []
      for page in jo['pages']:
          # '$' and '#' are the field and entry separators of the play
          # list, so a part title containing either would corrupt it.
          part = str(page['part']).replace('#', '-').replace('$', '-')
          entries.append('{0}${1}_{2}#'.format(part, aid, page['cid']))

      vod = {
          "vod_id": aid,
          "vod_name": jo['title'].replace("<em class=\"keyword\">", "").replace("</em>", ""),
          "vod_pic": jo['pic'],
          "type_name": jo['tname'],
          "vod_year": "",
          "vod_area": "",
          "vod_remarks": "",
          "vod_actor": "",
          "vod_director": "",
          "vod_content": jo['desc'],
          "vod_play_from": 'B站',
          "vod_play_url": ''.join(entries),
      }
      return {'list': [vod]}
  def searchContent(self, key, quick):
      """Return an empty result list; both arguments are ignored."""
      return {'list': []}
  def playerContent(self, flag, id, vipFlags):
      """Resolve a play id to a direct stream URL.

      Args:
          flag: Unused.
          id: Play id of the form ``"<aid>_<cid>"``, the format that
              ``detailContent`` writes into ``vod_play_url``.
          vipFlags: Unused.

      Returns:
          dict with ``parse``, ``playUrl``, ``url``, ``header`` and
          ``contentType``. ``url`` is the URL of the largest ``durl``
          segment (the first one on ties), or ``''`` when the API returns
          no segments.
      """
      ids = id.split("_")
      # The cid is interpolated directly; the previous URL template placed
      # two stray encoded spaces ("%20%20") in front of it.
      url = 'https://api.bilibili.com:443/x/player/playurl?avid={0}&cid={1}&qn=112'.format(ids[0], ids[1])
      rsp = self.fetch(url)
      segments = json.loads(rsp.text)['data']['durl']

      streamUrl = ''
      if segments:
          # max() keeps the first maximal element, matching the strict
          # "<" comparison of the earlier index loop.
          streamUrl = max(segments, key=lambda seg: int(seg['size']))['url']

      return {
          "parse": 0,
          "playUrl": '',
          "url": streamUrl,
          "header": {
              "Referer": "https://www.bilibili.com",
              "User-Agent": "Mozilla/5.0 (Macintosh; Intel Mac OS X 10_15_7) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/100.0.4896.127 Safari/537.36",
          },
          "contentType": 'video/x-flv',
      }
  # Static spider configuration; homeContent returns config['filter'] under
  # 'filters' when asked for filters.
  config = {"player": {}, "filter": {}}

  # Request headers passed to fetch() by detailContent.
  header = {}
  254. def localProxy(self,param):
  255. return [200, "video/MP2T", action, ""