# -*- coding: UTF-8 -*-
# /*
# *      Copyright (C) 2011 Libor Zoubek,ivars777
# *
# *
# *  This Program is free software; you can redistribute it and/or modify
# *  it under the terms of the GNU General Public License as published by
# *  the Free Software Foundation; either version 2, or (at your option)
# *  any later version.
# *
# *  This Program is distributed in the hope that it will be useful,
# *  but WITHOUT ANY WARRANTY; without even the implied warranty of
# *  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# *  GNU General Public License for more details.
# *
# *  You should have received a copy of the GNU General Public License
# *  along with this program; see the file COPYING.  If not, write to
# *  the Free Software Foundation, 675 Mass Ave, Cambridge, MA 02139, USA.
# *  http://www.gnu.org/copyleft/gpl.html
# *
# */
import os
import re
import sys
import urllib
import urllib2
import traceback
import cookielib
import requests
from htmlentitydefs import name2codepoint as n2cp
import HTMLParser
import StringIO

#import threading
#import Queue
import pickle
import string
import simplejson as json
#from demjson import demjson
#import demjson
import json
#from bs4 import BeautifulSoup

# User-Agent header value sent by the HTTP helpers in this module
# (request0/post0/post_json always set it; request/post only when the caller
# did not supply one).
UA = 'Mozilla/6.0 (Windows; U; Windows NT 5.1; en-GB; rv:1.9.0.5) Gecko/2008092417 Firefox/3.0.3'
# Verbosity threshold: debug() prints when LOG > 1, info() prints when LOG > 0.
LOG = 2

# Module-wide cookie jar; stays None until init_urllib() creates it.
_cookie_jar = None
# Cache key used by init_urllib()/cache_cookies() to load/store the cookies.
CACHE_COOKIES = 'cookies'

def play_video(streams):
    """Let the user pick a stream, fetch its first subtitle track and play it.

    With more than one stream the choices are listed on stdout and an index is
    read from stdin. Input that is not an integer, or a negative index,
    selects the first stream; an index past the end selects the last one.

    If the chosen stream has subtitles, the first one is downloaded and saved
    in the current directory as "<stream name>.srt" (TTAF/XML subtitles are
    converted with ttaf2srt() first).

    :param streams: non-empty list of stream dicts; the keys read here are
        "name", "url", optionally "subs" (list of dicts with "url") and, when
        several streams are offered, "quality", "lang" and "type"
    :return: the result of player() for the chosen stream
    """
    if len(streams) > 1:
        for i, s in enumerate(streams):
            print("%s: [%s,%s,%s] %s" % (i, s["quality"], s["lang"].encode("utf8"), s["type"], s["name"]))
        a = raw_input("Select stram to play: ")
        try:
            n = int(a)
        except ValueError:
            n = 0
        # Clamp into the valid range so a negative number cannot silently
        # index from the end (or raise IndexError when below -len).
        n = max(0, min(n, len(streams) - 1))
        stream = streams[n]
    else:
        stream = streams[0]

    title = stream["name"]
    url = stream["url"]
    suburl = ""
    print(url)
    if "subs" in stream and stream["subs"]:
        suburl = stream["subs"][0]["url"]
        print("\n**Download subtitles %s - %s" % (title, suburl))
        response = urllib2.urlopen(suburl)
        try:
            subs = response.read()
        finally:
            response.close()
        if subs:
            # Characters that would break the file name are replaced by "_".
            fname0 = re.sub("[/\n\r\t,]", "_", title)
            subext = ".srt"
            subfile = os.path.join("", fname0 + subext)
            if ".xml" in suburl:
                subs = ttaf2srt(subs)
            # ttaf2srt() returns unicode; encode explicitly so non-ASCII
            # subtitles do not fail on the implicit ASCII conversion.
            if isinstance(subs, unicode):
                subs = subs.encode("utf8")
            with open(subfile, "w") as f:
                f.write(subs)
        else:
            print("\n Error downloading subtitle %s" % suburl)
    return player(url, stream["name"], suburl)
            
def player(url,title="",suburl=""):
    """Launch an external player for *url* and wait for it to exit.

    URLs starting with "https" are handed to VLC, everything else to
    gst-launch-1.0 (both at hard-coded Windows install paths).

    :param url: stream URL to play
    :param title: UTF-8 encoded title, passed to VLC as --meta-title
    :param suburl: accepted but not used by this function
    :return: None
    """
    from subprocess import call
    print("\n**Play stream %s\n%s"%(title,url.encode("utf8")))

    # The title is re-encoded for the local file system so VLC shows it correctly.
    meta_title = title.decode("utf8").encode(sys.getfilesystemencoding())
    vlc_cmd = [
        r"c:\Program Files\VideoLAN\VLC\vlc.exe",
        url,
        "--meta-title",
        meta_title,
        "--http-user-agent",
        "Enigma2",
    ]
    # Alternative pipeline kept for reference:
    # gst-launch-1.0 -v souphttpsrc ssl-strict=false proxy=127.0.0.1:8888 extra-headers="Origin:adadadasd"  location="http://bitdash-a.akamaihd.net/content/sintel/sintel.mpd" ! decodebin! autovideosink
    gst_cmd = [
        r"C:\gstreamer\1.0\x86_64\bin\gst-launch-1.0",
        "-v",
        "playbin",
        'uri="%s"'%url,
    ]

    if url.startswith("https"):
        chosen = vlc_cmd
    else:
        chosen = gst_cmd
    # The player's exit status is intentionally ignored.
    call(chosen)
    return

# Stream-proxy URL format used by streamproxy_encode()/streamproxy_decode():
#   PROXY_URL + <escaped target url> [SPLIT_CHAR + name=value]...
# Separator between the target URL and each "name=value" header segment.
SPLIT_CHAR = "~"
# Replacement for a literal SPLIT_CHAR inside the URL or a header value.
SPLIT_CODE = "%7E"
# Replacement for "=" inside a header value.
EQ_CODE = "%3D"
# Replacement for ":" inside the target URL.
COL_CODE = "%3A"
# Prefix put in front of every proxied URL.
PROXY_URL = "http://localhost:88/"

def streamproxy_encode(url, headers=None):
    """Wrap *url* (and optional request headers) into a stream-proxy URL.

    The result is PROXY_URL followed by the target URL, in which SPLIT_CHAR and
    ":" are replaced by SPLIT_CODE and COL_CODE. A "?" is appended to the
    target URL when it has none. Each header is appended as
    SPLIT_CHAR + "name=value", with "=" and SPLIT_CHAR in the value replaced
    by EQ_CODE and SPLIT_CODE.

    :param url: target URL
    :param headers: optional mapping of header name -> string value
    :return: the proxy URL as a string
    """
    if "?" not in url:
        url = url + "?"
    url2 = PROXY_URL + url.replace(SPLIT_CHAR, SPLIT_CODE).replace(":", COL_CODE)
    if headers:
        encoded = [
            "%s=%s" % (h, headers[h].replace("=", EQ_CODE).replace(SPLIT_CHAR, SPLIT_CODE))
            for h in headers
        ]
        url2 = url2 + SPLIT_CHAR + SPLIT_CHAR.join(encoded)
    return url2

def streamproxy_decode(urlp):
    """Split a stream-proxy URL back into the target URL and its headers.

    The leading "http://host" of the proxy is removed, the remainder is split
    on SPLIT_CHAR, the first part (minus its leading "/") is percent-decoded
    into the target URL and every following "name=value" part becomes a
    header entry with a percent-decoded value.

    :param urlp: proxy URL as produced by streamproxy_encode(); a value
        without an "http://host" prefix is treated as the path itself
    :return: tuple (url, headers) where headers is a dict
    """
    prefix = re.search("http://[^/]+", urlp)
    # Strip only the proxy prefix itself, never a later occurrence of it.
    path = urlp.replace(prefix.group(0), "", 1) if prefix else urlp
    p = path.split(SPLIT_CHAR)
    url = urllib.unquote(p[0][1:])
    headers = {}
    for h in p[1:]:
        name, sep, value = h.partition("=")
        if not sep:
            # Segment without "=" is not a header; ignore it instead of crashing.
            continue
        headers[name] = urllib.unquote(value)
    return url, headers

class Captions(object):
    """Subtitle cues parsed from a WebVTT or TTAF/XML document.

    ``subs`` holds one dict per cue with the keys "begin" and "end"
    (values returned by str2sec(), or -1 when a TTAF cue has no such
    attribute), "style" (TTAF style id or None) and "text".
    ``styles`` maps TTAF style ids to a dict of the style's attributes.
    """

    def __init__(self, uri):
        """Download *uri* and parse the captions it returns.

        Only URIs starting with "http" are fetched; any other URI, or a
        response whose status is not 200, leaves the instance empty.
        """
        self.subs = []
        self.styles = {}
        if not uri.startswith("http"):
            return
        r = requests.get(uri)
        if r.status_code == 200:
            self.loads(r.content)

    def loads(self, s):
        """Parse caption text *s*; the format is detected from its first line.

        "WEBVTT" in the first line selects the VTT parser, "<?xml" the TTAF
        parser; anything else is ignored.
        """
        first_line = s.split("\n", 1)[0]
        if "WEBVTT" in first_line:  # vtt captions
            self.load_vtt(s)
        elif "<?xml" in first_line:
            self.load_ttaf(s)

    def load_ttaf(self, s):
        """Collect <style .../> definitions and <p ...>...</p> cues from *s*."""
        for tag in re.findall("<style .+?/>", s):
            st = dict(re.findall(r'(\w+)="([^ "]+)"', tag))
            # A style without an id cannot be referenced by a cue; skip it.
            if "id" in st:
                self.styles[st["id"]] = st
        for para in re.findall("<p .+?</p>", s):
            begin = re.search('begin="([^"]+)"', para)
            end = re.search('end="([^"]+)"', para)
            style = re.search('style="([^"]+)"', para)
            body = re.search("<p[^>]+>(.+)</p>", para)
            text = body.group(1).replace("\n", "") if body else ""
            text = re.sub(r"<br\s*?/>", "\n", text)
            # Any remaining inline markup is replaced by a single space.
            text = re.sub("<.+?>", " ", text)
            self.subs.append({
                "begin": str2sec(begin.group(1)) if begin else -1,
                "end": str2sec(end.group(1)) if end else -1,
                "style": style.group(1) if style else None,
                "text": text,
            })

    def load_vtt(self, s):
        """Collect cues from WebVTT text *s*.

        Every line containing "start --> end" opens a cue; the following
        lines up to the next blank line form its text (joined with "\\n",
        unicode lines encoded as UTF-8).
        """
        f = StringIO.StringIO(s)
        while True:
            line = f.readline()
            if not line:
                break
            m = re.search(r"([\d\.\,:]+)\s*-->\s*([\d\.\,\:]+)", line)
            if not m:
                continue
            lines = []
            line = f.readline()
            while line.strip():
                txt = line.strip()
                if isinstance(txt, unicode):
                    txt = txt.encode("utf8")
                lines.append(txt)
                line = f.readline()
            self.subs.append({
                "begin": str2sec(m.group(1)),
                "end": str2sec(m.group(2)),
                "style": None,
                "text": "\n".join(lines),
            })
            
def str2sec(r):
    """Convert a time stamp string to milliseconds.

    Accepts "[HH:]MM:SS[.fff]" with "." or "," as the decimal separator
    (despite the name, the result is in milliseconds, not seconds).

    :param r: string containing the time stamp
    :return: int number of milliseconds, or -1 if no time stamp is found
    """
    m = re.search(r"(\d+:)*(\d+):(\d+(?:\.\d+)?)", r.replace(",", "."))
    if not m:
        return -1
    hours = int(m.group(1)[:-1]) if m.group(1) else 0
    msec = hours * 60 * 60 * 1000 + int(m.group(2)) * 60 * 1000
    # round() instead of plain int(): float("1.001") * 1000 is 1000.999...,
    # which truncation would turn into 1000.
    msec += int(round(float(m.group(3)) * 1000))
    return msec

#c = Captions("http://195.13.216.2/mobile-vod/mp4:lb_barbecue_fr_lq.mp4/lb_barbecue_lv.vtt")  
#c = Captions("http://www.bbc.co.uk/iplayer/subtitles/ng/modav/bUnknown-0edd6227-0f38-411c-8d46-fa033c4c61c1_b05ql1s3_1479853893356.xml")
#url = "http://195.13.216.2/mobile-vod/mp4:ac_now_you_see_me_2_en_lq.mp4/ac_now_you_see_me_2_lv.vtt"
#c = Captions(url)

#pass


def ttaf2srt(s):
    """Convert TTAF/XML subtitles to SubRip (SRT) text.

    Every <p ...>...</p> element that has both a begin and an end attribute
    becomes one numbered SRT entry; "." in the time stamps is replaced by ","
    and <br/> tags by newlines. Elements without timing are skipped.

    :param s: TTAF document, unicode or UTF-8 encoded bytes
    :return: unicode SRT text ("" when no cue is found)
    """
    # Decode up front: mixing UTF-8 bytes into a unicode result would fail on
    # the first non-ASCII character.
    if isinstance(s, bytes):
        s = s.decode("utf-8", "replace")
    entries = []
    for attrs, txt in re.findall("<p ([^>]+)>(.+?)</p>", s, re.DOTALL):
        begin = re.search('begin="(.+?)"', attrs)
        end = re.search('end="(.+?)"', attrs)
        if not (begin and end):
            continue
        entries.append(u"%s\n%s --> %s\n%s\n\n" % (
            len(entries) + 1,
            begin.group(1).replace(".", ","),
            end.group(1).replace(".", ","),
            re.sub("<br */>", "\n", txt),
        ))
    return u"".join(entries)


def item():
    """Return a new stream-description dict with every key set to its default."""
    return dict(
        name='',
        url='',
        quality='???',
        surl='',
        subs='',
        headers={},
        desc="",
        img="",
        lang="",
        type="",
        order=0
    )

class _StringCookieJar(cookielib.LWPCookieJar):
    """LWP cookie jar whose cookie store can be restored from / dumped to a pickle string."""

    def __init__(self, string=None, filename=None, delayload=False, policy=None):
        """Create the jar and, when *string* is non-empty, restore cookies from it.

        :param string: pickled cookie store as produced by dump(), or None
        :param filename, delayload, policy: forwarded to LWPCookieJar
        """
        cookielib.LWPCookieJar.__init__(self, filename, delayload, policy)
        has_payload = bool(string) and len(string) > 0
        if has_payload:
            # NOTE(review): pickle.loads runs arbitrary code for crafted input;
            # the cached string must come from a trusted store.
            self._cookies = pickle.loads(str(string))

    def dump(self):
        """Return the current cookie store serialized with pickle."""
        serialized = pickle.dumps(self._cookies)
        return serialized


def init_urllib(cache=None):
    """
    Install a global urllib2 opener that keeps cookies in the module cookie jar.

    :param cache: optional object with a get(key) method; when given, the
        value stored under CACHE_COOKIES seeds the new cookie jar
    """
    global _cookie_jar
    stored = cache.get(CACHE_COOKIES) if cache is not None else None
    _cookie_jar = _StringCookieJar(stored)
    cookie_handler = urllib2.HTTPCookieProcessor(_cookie_jar)
    urllib2.install_opener(urllib2.build_opener(cookie_handler))


def cache_cookies(cache):
    """
    Store the dumped module cookie jar in *cache* under CACHE_COOKIES.

    Nothing is stored while the module cookie jar is falsy (for example
    before init_urllib() has been called).

    :param cache: object with a set(key, value) method
    """
    global _cookie_jar
    if not _cookie_jar:
        return
    cache.set(CACHE_COOKIES, _cookie_jar.dump())


def request0(url, headers=None):
    """GET *url* with urllib2 and return the response body.

    The module User-Agent (UA) is always sent. When the server answers with
    an HTTP error status, the body of the error response is returned instead
    of raising.

    :param url: URL to fetch
    :param headers: optional dict of extra request headers
    :return: response body as a byte string
    """
    debug('request: %s' % url)
    req = urllib2.Request(url, headers=headers or {})
    req.add_header('User-Agent', UA)
    try:
        response = urllib2.urlopen(req)
    except urllib2.HTTPError as error:
        # HTTPError is itself a readable response object.
        response = error
    try:
        data = response.read()
    finally:
        response.close()

    debug('len(data) %s' % len(data))
    return data

def request(url, headers=None):
    """GET *url* with the requests library and return the response body.

    The module User-Agent (UA) is sent unless *headers* already contains a
    'User-Agent' entry. The response body is returned whatever the HTTP
    status is.

    :param url: URL to fetch
    :param headers: optional dict of request headers (not modified)
    :return: response body (r.content)
    :raises: whatever requests.get raises, e.g. on connection failure
    """
    debug('request: %s' % url)
    # Work on a copy: neither the caller's dict nor a shared default may
    # accumulate the User-Agent entry between calls.
    headers = dict(headers) if headers else {}
    if 'User-Agent' not in headers:
        headers['User-Agent'] = UA
    # No try/except here: there is no response to fall back to when the
    # request itself fails, so the real exception is allowed to propagate.
    r = requests.get(url, headers=headers)
    data = r.content

    debug('len(data) %s' % len(data))
    return data

def post(url, data, headers=None):
    """POST form data to *url* with the requests library and return the body.

    *data* is form-encoded with urllib.urlencode. The module User-Agent (UA)
    is sent unless *headers* already contains a 'User-Agent' entry. The
    response body is returned whatever the HTTP status is.

    :param url: URL to post to
    :param data: mapping or sequence of pairs accepted by urllib.urlencode
    :param headers: optional dict of request headers (not modified)
    :return: response body (r.content)
    :raises: whatever requests.post raises, e.g. on connection failure
    """
    postdata = urllib.urlencode(data)
    # Work on a copy so the caller's dict / a shared default is never modified.
    headers = dict(headers) if headers else {}
    if 'User-Agent' not in headers:
        headers['User-Agent'] = UA
    # requests adds the form Content-Type only for dict/list payloads, not for
    # an already encoded string, so declare it here (as urllib2 does in
    # post0) unless the caller chose one.
    if not any(name.lower() == 'content-type' for name in headers):
        headers['Content-Type'] = 'application/x-www-form-urlencoded'
    r = requests.post(url, data=postdata, headers=headers)
    return r.content

def post0(url, data, headers=None):
    """POST form data to *url* with urllib2 and return the response body.

    *data* is form-encoded with urllib.urlencode and the module User-Agent
    (UA) is always sent. When the server answers with an HTTP error status,
    the body of the error response is returned instead of raising.

    :param url: URL to post to
    :param data: mapping or sequence of pairs accepted by urllib.urlencode
    :param headers: optional dict of extra request headers
    :return: response body as a byte string
    """
    postdata = urllib.urlencode(data)
    req = urllib2.Request(url, postdata, headers or {})
    req.add_header('User-Agent', UA)
    try:
        response = urllib2.urlopen(req)
    except urllib2.HTTPError as error:
        # HTTPError is itself a readable response object.
        response = error
    try:
        data = response.read()
    finally:
        response.close()
    return data


def post_json(url, data, headers=None):
    """POST *data* as a JSON document to *url* with urllib2 and return the body.

    'Content-Type: application/json' and the module User-Agent (UA) are
    always sent. Unlike post0(), HTTP error statuses are not caught here.

    :param url: URL to post to
    :param data: JSON-serializable object
    :param headers: optional dict of extra request headers (not modified)
    :return: response body as a byte string
    :raises urllib2.HTTPError: when the server answers with an error status
    """
    postdata = json.dumps(data)
    # Copy first: writing Content-Type into the argument would leak it into
    # the caller's dict or into a shared default.
    headers = dict(headers) if headers else {}
    headers['Content-Type'] = 'application/json'
    req = urllib2.Request(url, postdata, headers)
    req.add_header('User-Agent', UA)
    response = urllib2.urlopen(req)
    try:
        data = response.read()
    finally:
        response.close()
    return data


#def run_parallel_in_threads(target, args_list):
    #result = Queue.Queue()
    ## wrapper to collect return value in a Queue

    #def task_wrapper(*args):
        #result.put(target(*args))

    #threads = [threading.Thread(target=task_wrapper, args=args) for args in args_list]
    #for t in threads:
        #t.start()
    #for t in threads:
        #t.join()
    #return result


def substr(data, start, end):
    """Return the part of *data* from *start* up to (not including) *end*.

    The result begins with the *start* marker itself. Both positions come
    from str.find(), so its -1 "not found" result is used as a slice index:
    a missing *start* yields "", a missing *end* yields everything from
    *start* except the last character of *data*.
    """
    begin_at = data.find(start)
    return data[begin_at:data.find(end, begin_at)]


def save_to_file(url, file):
    """Download *url* with request() and store the body in *file*.

    Failures are reported with a printed traceback instead of being raised.

    :param url: URL to download
    :param file: destination path
    :return: the result of save_data_to_file() (True on success), or None
        when the download or the save raised
    """
    try:
        return save_data_to_file(request(url), file)
    except Exception:
        # Exception rather than a bare except, so Ctrl-C and SystemExit
        # still stop the program.
        traceback.print_exc()


def save_data_to_file(data, file):
    """Write *data* to *file* in binary mode.

    Failures are reported with a printed traceback instead of being raised.

    :param data: byte string to write
    :param file: destination path (overwritten if it exists)
    :return: True on success, None when writing failed
    """
    try:
        # The with-block closes the handle even when write() fails.
        with open(file, 'wb') as f:
            f.write(data)
        info('File %s saved' % file)
        return True
    except Exception:
        # Exception rather than a bare except, so Ctrl-C and SystemExit
        # still stop the program.
        traceback.print_exc()


def read_file(file):
    """Return the content of *file*, or '' when the path does not exist.

    :param file: path of the file to read (opened in text mode)
    :return: the whole file content as a string
    """
    if not os.path.exists(file):
        return ''
    # The with-block closes the handle even when read() raises.
    with open(file, 'r') as f:
        return f.read()


def _substitute_entity(match):
    """Return the character for one HTML entity matched by decode_html().

    *match* comes from the pattern ``&(#?)(x?)(\\w+);``: group 1 is "#" for a
    numeric reference, group 2 is "x" for hexadecimal notation and group 3 is
    the number or name.

    :return: the decoded unicode character, or the matched text unchanged
        when the entity is unknown or its number is invalid
    """
    if match.group(1) == '#':
        # Numeric reference: hexadecimal with the "x" marker, decimal without.
        base = 16 if match.group(2) == 'x' else 10
        try:
            return unichr(int(match.group(3), base))
        except (ValueError, OverflowError):
            # Not a number / not a valid code point: leave the text as it is
            # rather than aborting the whole substitution.
            return match.group()
    # Named entity. The optional "x" group swallows the first letter of names
    # such as "xi", so it has to be put back in front of the rest.
    cp = n2cp.get(match.group(2) + match.group(3))
    if cp:
        return unichr(cp)
    return match.group()


def decode_html(data):
    """Decode HTML entities in a UTF-8 byte string and return unicode text.

    Anything whose type is not exactly ``str`` is returned untouched. The
    input is decoded as UTF-8 (undecodable bytes are dropped) and every
    ``&name;`` / ``&#N;`` / ``&#xN;`` entity is replaced through
    _substitute_entity(). If anything fails, the traceback and the data are
    printed and the data is returned as it was at that point.
    """
    if type(data) != str:
        return data
    try:
        data = unicode(data, 'utf-8', errors='ignore')
        pattern = re.compile(r'&(#?)(x?)(\w+);')
        decoded, _count = pattern.subn(_substitute_entity, data)
        return decoded
    except:
        traceback.print_exc()
        print([data])
        return data

def unescape(s0):
    """Replace "&amp;" and numeric character references in *s0*.

    "&amp;" is turned into "&" first; afterwards every "&#...;" reference
    found is replaced by the character HTMLParser resolves it to (UTF-8
    encoded when the text is a ``str``). Named entities other than "&amp;"
    are left alone.
    """
    result = s0.replace("&amp;","&")
    for entity in re.findall("&#\w+;",result):
        decoded = HTMLParser.HTMLParser().unescape(entity)
        if isinstance(result,str):
            decoded = decoded.encode("utf8")
        result = result.replace(entity,decoded)
    return result

def debug(text):
    """Print *text* with a [DEBUG] prefix when LOG is greater than 1.

    The text is wrapped in a list so that its repr is what gets printed.
    """
    if LOG <= 1:
        return
    print('[DEBUG] %s' % ([text],))

def info(text):
    """Print *text* with an [INFO] prefix when LOG is greater than 0.

    The text is wrapped in a list so that its repr is what gets printed.
    """
    if LOG <= 0:
        return
    print('[INFO] %s' % ([text],))

def error(text):
    """Print *text* with an [ERROR] prefix, regardless of the LOG level.

    The text is wrapped in a list so that its repr is what gets printed.
    """
    message = '[ERROR] %s' % ([text],)
    print(message)

# Lookup table used by replace_diacritic(): maps an accented unicode character
# to the ASCII character that replaces it.
_diacritic_replace = {u'\u00f3': 'o',
                      # NOTE(review): U+0213 mapped to '-' looks like a typo
                      # for U+2013 (en dash) - confirm before changing.
                      u'\u0213': '-',
                      u'\u00e1': 'a',
                      u'\u010d': 'c',
                      u'\u010c': 'C',
                      u'\u010f': 'd',
                      u'\u010e': 'D',
                      u'\u00e9': 'e',
                      u'\u011b': 'e',
                      u'\u00ed': 'i',
                      u'\u0148': 'n',
                      u'\u0159': 'r',
                      u'\u0161': 's',
                      u'\u0165': 't',
                      u'\u016f': 'u',
                      u'\u00fd': 'y',
                      u'\u017e': 'z',
                      # The three entries below repeat keys already present
                      # above (u'\xed' is u'\u00ed', and so on) with the same
                      # values.
                      u'\xed': 'i',
                      u'\xe9': 'e',
                      u'\xe1': 'a',
                      }


def replace_diacritic(string):
    """Return *string* with every character listed in _diacritic_replace swapped
    for its replacement; all other characters are kept as they are."""
    return ''.join(_diacritic_replace.get(ch, ch) for ch in string)


def params(url=None):
    """Parse a query string whose values are hex-encoded into a dict.

    When *url* is empty or None, sys.argv[2] is parsed instead. All "?" are
    removed, the rest is split on "&", and only "name=value" pieces with
    exactly one "=" are kept (a later duplicate name wins). Every value is
    then hex-decoded. Strings shorter than two characters give an empty dict.
    """
    query = url if url else sys.argv[2]
    found = {}
    if len(query) >= 2:
        for piece in query.replace('?', '').split('&'):
            fields = piece.split('=')
            if len(fields) == 2:
                found[fields[0]] = fields[1]
    # Decode only after parsing, so just the surviving value of a repeated
    # name is decoded.
    for name in list(found.keys()):
        found[name] = found[name].decode('hex')
    return found


def int_to_base(number, base):
    """Return the integer *number* written in the given *base*.

    Digits are taken from "0-9", then "a-z", then "A-Z", so bases up to 62
    can be represented. Negative numbers get a leading "-".

    :param number: integer to convert
    :param base: target base, at least 2
    :return: string representation of *number*
    :raises ValueError: if *base* is smaller than 2
    :raises IndexError: if a digit value beyond the 62 available symbols is needed
    """
    if base < 2:
        # Base 0 would divide by zero and base 1 would never terminate.
        raise ValueError("base must be >= 2, got %r" % (base,))
    # ascii_letters instead of the locale-dependent string.letters.
    digs = string.digits + string.ascii_letters
    if number == 0:
        return digs[0]
    negative = number < 0
    number = abs(number)
    digits = []
    while number:
        # divmod keeps the arithmetic on integers on every Python version.
        number, remainder = divmod(number, base)
        digits.append(digs[remainder])
    if negative:
        digits.append('-')
    digits.reverse()
    return ''.join(digits)


def extract_jwplayer_setup(data):
    """
    Extracts jwplayer setup configuration and returns it as a dictionary.

    The page is searched for a packed <script> whose payload and "|"-separated
    word list are passed as quoted arguments. Each non-empty word replaces its
    base-36 index token in the payload, and the argument of the resulting
    ``.setup(...)`` call is parsed as JSON.

    :param data: A string to extract the setup from
    :return: A dictionary containing the setup configuration, or None when
             no packed script or no setup call is found
    """
    packed = re.search(r'<script.+?}\(\'(.+)\',\d+,\d+,\'([\w\|]+)\'.*</script>', data, re.I | re.S)
    if not packed:
        return None
    payload = packed.group(1)
    words = packed.group(2).split('|')
    # Highest index first, matching the order of the original substitution.
    for idx in range(len(words) - 1, -1, -1):
        word = words[idx]
        if len(word) > 0:
            payload = re.sub(r'\b%s\b' % int_to_base(idx, 36), word, payload)
    setup = re.search(r'\.setup\(([^\)]+?)\);', payload)
    if not setup:
        return None
    return json.loads(setup.group(1).decode('string_escape'))


#def parse_html(url):
#    return BeautifulSoup(request(url), 'html5lib', from_encoding='utf-8')

if __name__ == "__main__":
    # Manual smoke test: wrap a stream URL for the local stream proxy, print
    # the proxied URL and hand it to the external player.
    # Sample title for experiments with unescape(); not used below.
    sample_title = 'B\xc4\x93thovena D\xc4\x81rgumu Taka (2014)/Beethoven&#x27;s Treasure [LV]'
    # Example of an already proxied URL:
    # "http://localhost:88/https://walterebert.com/playground/video/hls/ts/480x270.m3u8?token=xxxx~User-Agent=Enigma2~Cookie=xxxxx"
    stream_url = "http://hyt4d6.vkcache.com/secip/0/UMQ3q2gNjTlOPnEVm3iTiA/ODAuMjMyLjI0MC42/1479610800/hls-vod-s3/flv/api/files/videos/2015/09/11/144197748923a22.mp4.m3u8http://hyt4d6.vkcache.com/secip/0/Y-ZA1qRm8toplc0dN_L6_w/ODAuMjMyLjI0MC42/1479654000/hls-vod-s3/flv/api/files/videos/2015/09/11/144197748923a22.mp4.m3u8"
    request_headers = {"User-Agent":"Mozilla/5.0 (iPhone; CPU iPhone OS 9_2 like Mac OS X) AppleWebKit/601.1 (KHTML, like Gecko) CriOS/47.0.2526.70 Mobile/13C71 Safari/601.1.46"}
    proxied_url = streamproxy_encode(stream_url,request_headers)
    print(proxied_url)
    player(proxied_url)