Python module (submodule repository) that provides content (video streams) from various online stream sources to the corresponding Enigma2, Kodi, and Plex plugins

Downloader.py 12KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293
  1. #from boxbranding import getMachineBrand, getMachineName
  2. import sys,os, os.path, re
  3. import urlparse, requests
  4. from twisted.web import client
  5. from twisted.internet import reactor, defer, ssl
  6. USER_AGENT = "Enigma2 HbbTV/1.1.1 (+PVR+RTSP+DL;OpenATV;;;)"
  7. #####################################################################################################
  8. class HTTPProgressDownloader(client.HTTPDownloader):
  9. def __init__(self, url, outfile, headers=None):
  10. agent = USER_AGENT
  11. if headers and "user-agent" in headers:
  12. agent = headers["user-agent"]
  13. if headers and "User-Agent" in headers:
  14. agent = headers["User-Agent"]
  15. client.HTTPDownloader.__init__(self, url, outfile, headers=headers, agent=agent)
  16. self.status = None
  17. self.progress_callback = None
  18. self.deferred = defer.Deferred()
  19. def noPage(self, reason):
  20. if self.status == "304":
  21. print reason.getErrorMessage()
  22. client.HTTPDownloader.page(self, "")
  23. else:
  24. client.HTTPDownloader.noPage(self, reason)
  25. def gotHeaders(self, headers):
  26. if self.status == "200":
  27. if headers.has_key("content-length"):
  28. self.totalbytes = int(headers["content-length"][0])
  29. else:
  30. self.totalbytes = 0
  31. self.currentbytes = 0.0
  32. return client.HTTPDownloader.gotHeaders(self, headers)
  33. def pagePart(self, packet):
  34. if self.status == "200":
  35. self.currentbytes += len(packet)
  36. if self.totalbytes and self.progress_callback:
  37. self.progress_callback(self.currentbytes, self.totalbytes)
  38. return client.HTTPDownloader.pagePart(self, packet)
  39. def pageEnd(self):
  40. return client.HTTPDownloader.pageEnd(self)
  41. class DownloadWithProgress:
  42. def __init__(self, url, outputfile, headers=None, limit=0, contextFactory=None, *args, **kwargs):
  43. self.limit = limit
  44. uri = urlparse.urlparse(url)
  45. scheme = uri.scheme
  46. host = uri.hostname
  47. port = uri.port if uri.port else 80
  48. path = uri.path
  49. if not headers:
  50. headers = {"user-agent":USER_AGENT}
  51. self.factory = HTTPProgressDownloader(url, outputfile, headers, *args, **kwargs)
  52. if scheme == "https":
  53. self.connection = reactor.connectSSL(host, port, self.factory, ssl.ClientContextFactory())
  54. else:
  55. self.connection = reactor.connectTCP(host, port, self.factory)
  56. def start(self):
  57. return self.factory.deferred
  58. def stop(self):
  59. if self.connection:
  60. print "[stop]"
  61. self.connection.disconnect()
  62. def addProgress(self, progress_callback):
  63. print "[addProgress]"
  64. self.factory.progress_callback = progress_callback
  65. #####################################################################################################
  66. class DownloadWithProgressFragmented:
  67. def __init__(self, url, outputfile, headers = None, limit = 0, contextFactory=None, *args, **kwargs):
  68. self.url = url
  69. self.outputfile = outputfile
  70. self.base_url = "/".join(url.split("/")[:-1])+"/"
  71. self.headers = headers if headers else {"user-agent":"Enigma2"}
  72. self.limit = limit
  73. self.agent = kwargs["agent"] if "agent" in kwargs else None
  74. self.cookie = kwargs["cookie"] if "cookie" in kwargs else None
  75. self.deferred = defer.Deferred()
  76. #self.deferred.addCallback(self.start_download)
  77. def start_download(self):
  78. print "Start download"
  79. try:
  80. r = requests.get(self.url,headers=self.headers)
  81. except Exception as e:
  82. #self.deferred.errback("Cannot open manifsest file - %s"%url)
  83. self.deferred.errback(e)
  84. if not r.content.startswith("#EXTM3U"):
  85. self.deferred.errback(Exception("Not valid manifest file - %s"%self.url))
  86. streams = re.findall(r"#EXT-X-STREAM-INF:.*?BANDWIDTH=(\d+).*?\n(.+?)$", r.content, re.IGNORECASE | re.MULTILINE)
  87. if streams:
  88. sorted(streams, key=lambda item: int(item[0]), reverse=True)
  89. url = streams[0][1]
  90. if not url.startswith("http"):
  91. url = self.base_url + url
  92. try:
  93. r = requests.get(url, headers=self.headers)
  94. except Exception as e:
  95. self.deferred.errback(Exception("Cannot open manifsest file - %s"%url))
  96. self.ts_list = re.findall(r"#EXTINF:([\d\.]+),.*?\n(.+?)$", r.content, re.IGNORECASE | re.MULTILINE)
  97. if not len(self.ts_list):
  98. self.deferred.errback(Exception("Cannot read fragment list in manifsest file - %s"%url))
  99. self.ts_num = 0
  100. self.type = "vod" if "#EXT-X-ENDLIST" in r.content else "live"
  101. self.currentbytes = 0.0
  102. self.totalbytes = -1
  103. self.currenttime = 0.0
  104. self.totaltime = sum(map(float,zip(*self.ts_list)[0]))
  105. self.ts_file = open(self.outputfile, "wb")
  106. self.download_fragment()
  107. def download_fragment(self):
  108. if self.ts_num>=len(self.ts_list):
  109. pass
  110. #print "Call later"
  111. reactor.callLater(10,self.update_manifest)
  112. reactor.callLater(10, self.download_fragment)
  113. else:
  114. print "Start fragment download"
  115. url = self.ts_list[self.ts_num][1]
  116. if not "://" in url:
  117. url = self.base_url+url
  118. self.d = client.getPage(url,headers = self.headers)
  119. self.d.addCallbacks(self.download_ok,self.download_err)
  120. def download_ok(self,content):
  121. content_length = len(content)
  122. self.currentbytes += content_length
  123. self.currenttime += float(self.ts_list[self.ts_num][0])
  124. self.totalbytes = self.currentbytes * self.totaltime / self.currenttime
  125. self.ts_num += 1
  126. #print "Fragment %s downloaded (%s)"%(self.ts_num,len(content))
  127. self.ts_file.write(content)
  128. self.progress_callback(self.currentbytes, self.totalbytes)
  129. if self.type == "vod":
  130. if self.ts_num >= len(self.ts_list) or (self.limit and self.currenttime>self.limit):
  131. self.ts_file.close()
  132. self.download_finished()
  133. else:
  134. self.download_fragment()
  135. else:
  136. if self.limit and self.currenttime>self.limit: # TODO
  137. self.ts_file.close()
  138. self.download_finished()
  139. else:
  140. self.download_fragment()
  141. def update_manifest(self):
  142. self.d2 = client.getPage(self.url, headers=self.headers)
  143. self.d2.addCallbacks(self.update_manifest_ok, self.update_manifest_err)
  144. def update_manifest_ok(self,content):
  145. print "Update manifest"
  146. ts_list = re.findall(r"#EXTINF:([\d\.]+),\n(.+?)$", content, re.IGNORECASE | re.MULTILINE)
  147. last_ts = self.ts_list[-1]
  148. found = False
  149. for ts in ts_list:
  150. if ts == last_ts:
  151. found = True
  152. elif found:
  153. print "Append %s"%ts[1]
  154. self.ts_list.append(ts)
  155. #reactor.callLater(5,self.download_fragment)
  156. def update_manifest_err(self,content):
  157. return
  158. def download_err(self,content):
  159. self.deferred.errback("Error while downloading %s"%self.ts_list[self.ts_num][1])
  160. def download_finished(self):
  161. self.totalbytes = self.currentbytes
  162. self.deferred.callback("Done")
  163. def start(self):
  164. reactor.callLater(1,self.start_download)
  165. return self.deferred
  166. def stop(self):
  167. self.deferred.errback() # TODO
  168. def addProgress(self, progress_callback):
  169. print "[addProgress]"
  170. self.progress_callback = progress_callback
  171. #####################################################################################################
  172. def get_header(url,headers=None):
  173. headers = {"user-agent":USER_AGENT}
  174. r = requests.head(url,headers=headers)
  175. return r.headers
  176. def get_ext(mtype):
  177. stype = "http"
  178. if mtype in ("vnd.apple.mpegURL","application/x-mpegURL",'application/x-mpegurl',"application/vnd.apple.mpegurl"):
  179. return ".ts","hls"
  180. elif mtype in ("application/dash+xml"):
  181. return ".ts","dash" # TODO dash stream type could be different !
  182. elif mtype in ("video/mp4"):
  183. return ".mp4","http"
  184. elif mtype in ("video/MP2T","video/mp2t"):
  185. return ".ts","http"
  186. elif mtype in ("video/x-flv"):
  187. return ".flv","http"
  188. elif mtype in ("video/quicktime"):
  189. return ".mov","http"
  190. elif mtype in ("video/x-msvideo"):
  191. return ".avi","http"
  192. elif mtype in ("video/x-ms-wmv"):
  193. return ".wmv","http"
  194. elif mtype in ("video/x-matroska"):
  195. return ".mkv","http"
  196. else:
  197. return ".mp4","http"
  198. ##############################################
  199. def print_progress(currentbytes, totalbytes):
  200. progress = float(currentbytes)/float(totalbytes)*100
  201. print "%s (%i/%i)"%(progress,currentbytes,totalbytes)
  202. def download_ok(*args):
  203. print "Download OK"
  204. reactor.stop()
  205. def download_err(e):
  206. print "Download Error %s"%e.getBriefTraceback()
  207. pass
  208. def stop():
  209. reactor.stop()
  210. ###############################################
  211. def download_video(stream):
  212. stream = stream[0]
  213. url = stream["url"]
  214. headers = stream["headers"]
  215. output = stream["name"].replace("\\"," ").replace(":"," ").replace("|"," ")
  216. try:
  217. h = get_header(url,headers={"user-agent":"Enigma2"})
  218. mtype = h.get("content-type")
  219. ext,stream_type = get_ext(mtype)
  220. except:
  221. ext,stream_type = (".ts","hls")
  222. #output = urlparse.urlparse(url)[2].split('/')[-1] + ext
  223. output = output+ext
  224. output = os.path.join("downloads", output)
  225. if stream_type == "hls":
  226. d = DownloadWithProgressFragmented(url,output,headers={"user-agent":"Enigma2"})
  227. else:
  228. d = DownloadWithProgress(url,output,headers={"user-agent":"Enigma2"})
  229. d.addProgress(print_progress)
  230. d.start().addCallback(download_ok).addErrback(download_err)
  231. reactor.run()
  232. if __name__ == "__main__":
  233. if len(sys.argv)>2:
  234. url= sys.argv[1]
  235. output = sys.argv[1]
  236. else:
  237. url = "http://walterebert.com/playground/video/hls/ts/480x270.m3u8"
  238. url = "https://r3---sn-bavc5ajvh-gpme.googlevideo.com/videoplayback?key=yt6&mime=video%2Fmp4&sparams=clen%2Cdur%2Cei%2Cgir%2Cid%2Cinitcwndbps%2Cip%2Cipbits%2Citag%2Clmt%2Cmime%2Cmm%2Cmn%2Cms%2Cmv%2Cpl%2Cratebypass%2Crequiressl%2Csource%2Cupn%2Cexpire&expire=1490986184&lmt=1490940183963773&dur=1302.639&itag=18&ratebypass=yes&mm=31&requiressl=yes&ipbits=0&upn=azFGj8gY02w&ip=85.254.87.15&pl=23&ei=aFDeWLzqDcn-dLC_gdAM&signature=083F353AC09CD98A70AD7D9438DD3C91C781166B.715456B9C35F040BDC4728CA76A0D1779B684A90&source=youtube&mv=m&mt=1490964451&ms=au&mn=sn-bavc5ajvh-gpme&gir=yes&clen=73596250&id=o-AGH9y-hWn1MtW1VzCyI_8XYYEWODsTDBZbfagQH3BrfQ&initcwndbps=4493750"
  239. #url = "http://techslides.com/demos/sample-videos/small.mp4"
  240. #url = "http://wx17.poiuytrew.pw/s/c507282042b1bf25e0b72c34a68426f3/hd_30/Jackie.2016.D.iTunes.BDRip.1080p_720.mp4"
  241. #url = "http://player.tvnet.lv/live/amlst:11/chunklist_w361981294_b528000.m3u8"
  242. #url = "http://vod-hls-uk-live.akamaized.net/usp/auth/vod/piff_abr_full_hd/a3e90e-b08ktytr/vf_b08ktytr_f9d55583-afc7-49bb-9bf4-d8f1ac99f56f.ism.hlsv2.ism/vf_b08ktytr_f9d55583-afc7-49bb-9bf4-d8f1ac99f56f.ism.hlsv2-audio=128000-video=5070000.m3u8"
  243. #url = "https://58174450afee9.streamlock.net/vod/mp4:_definst_/f/e/8e49fc32.mp4/playlist.m3u8?safwerwfasendtime=1490877870&safwerwfasstarttime=1490859339&safwerwfashash=hS2FfVZysQVazBQ6RJn1IhUevBkKxIF09Ly3BjfT43U="
  244. try:
  245. h = get_header(url,headers={"user-agent":"Enigma2"})
  246. mtype = h.get("content-type")
  247. ext,stream_type = get_ext(mtype)
  248. except:
  249. ext,stream_type = (".ts","hls")
  250. output = urlparse.urlparse(url)[2].split('/')[-1] + ext
  251. output = os.path.join("downloads", output)
  252. if stream_type == "hls":
  253. d = DownloadWithProgressFragmented(url,output,headers={"user-agent":"Enigma2"})
  254. else:
  255. d = DownloadWithProgress(url,output,headers={"user-agent":"Enigma2"})
  256. d.addProgress(print_progress)
  257. d.start().addCallback(download_ok).addErrback(download_err)
  258. reactor.run()