else/TotalDL/totaldl.py

import bs4
import json
import requests
import os
import time
import sys

# Base HTTP headers sent with every request made through request_get.
# Per-call headers are merged on top of a copy of this dict.
HEADERS = {'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/42.0.2311.152 Safari/537.36'}

DOWNLOAD_DIRECTORY = ''
# Save files to this folder.
# If blank, file names are used as-is, i.e. relative to the current
# working directory.

IMGUR_ALBUM_INDV = '<metaproperty="og:image"'
IMGUR_ALBUM_INDV2 = 'linkrel="image_src"'
# The HTML string which tells us that an image link is
# on this line.
# handle_imgur_html removes every space from the page before searching,
# which is why these markers contain no spaces.
# NOTE(review): IMGUR_ALBUM_INDV2 is not referenced by any code visible
# in this file -- confirm whether it is still needed.

IMGUR_ALBUMFOLDERS = True
# If True, the individual images belonging to an album will be placed
#  into a folder named after the album, like
#  <album_id>/<index>_<img_id>.jpg
# Else, files will be named <album_id>_<index>_<img_id>.jpg and placed
#  directly in the download folder.

GFYCAT_MP4 = False
# If True, download gfycat urls in .mp4
# Else, .webm

GFYCAT_SUBDOMAINS = ['zippy', 'fat', 'giant']
# Gfycat media subdomains. handle_gfycat tries them in this order and
# keeps the first one that does not fail with StatusExc.

SLEEPINESS = 2
# The minimum number of seconds to wait in between making requests.
# Similar to PRAW's ratelimit handling.
# Not required, but probably better for the environment.

VIMEO_DICT_START = '"files":{"h264":'
VIMEO_DICT_END = ',"hls"'
# The HTML strings which surround the JSON dictionary describing
# where the mp4 files are.

VIMEO_PRIORITY = ['hd', 'sd', 'mobile']
# Download files in this priority: the first key present in the
# vimeo file dictionary wins.

LIVELEAK_YOUTUBEIFRAME = 'youtube.com/embed'
# If this string appears in a Liveleak page, the page is treated as a
# youtube embed and the iframe's src is handed back to handle_master.

LIVELEAK_RESOLUTIONS = ['h264_base', 'h264_720p', 'h264_270p']
# Resolution tags substituted into the Liveleak file url, tried in
# this order before falling back to the url found on the page.

YOUTUBE_DL_FORMAT = 'youtube-dl "{url}" --no-playlist --force-ipv4 -o "/{dir}/{name}.%(ext)s"'
# The format for the youtube-dl shell command.
# {url}, {dir} and {name} are filled in by handle_youtube using
# str.format; %(ext)s is passed through untouched in the command.
# NOTE(review): the output template starts with "/" before {dir}, so an
# empty DOWNLOAD_DIRECTORY produces a path beginning with "//" --
# confirm that this is intended.

DO_GENERIC = True
# If true, attempt to download whatever URL goes in
# Else, only download from the explicitly supported sites

''' End user config '''

# Timestamp (as returned by time.time()) of the most recent request.
# request_get reads and updates it to enforce the SLEEPINESS delay.
last_request = 0

if DOWNLOAD_DIRECTORY != '':
    # Some handlers build paths by plain concatenation
    # (DOWNLOAD_DIRECTORY + name), so the directory must end with a
    # separator. Append the platform's own separator: a hard-coded
    # backslash is an ordinary filename character on POSIX systems and
    # would create a directory literally named "<dir>\".
    if DOWNLOAD_DIRECTORY[-1] not in ['/', '\\']:
        DOWNLOAD_DIRECTORY += os.sep

    os.makedirs(DOWNLOAD_DIRECTORY, exist_ok=True)

class StatusExc(Exception):
    '''
    Raised by request_get when the server answers with an HTTP status
    code other than 200 or 206.
    '''

def download_file(url, localname, headers=None):
    '''
    Download `url` and save it as `localname` inside DOWNLOAD_DIRECTORY.

    url: The address of the file to fetch.
    localname: Destination path, relative to DOWNLOAD_DIRECTORY. Any
        missing parent folders are created.
    headers: Optional dict of extra HTTP headers for this request.

    Returns the final local path. If that path already exists, nothing
    is downloaded and the existing path is returned.

    Raises whatever request_get raises (StatusExc on a bad status code).
    '''
    localname = os.path.join(DOWNLOAD_DIRECTORY, localname)
    dirname = os.path.split(localname)[0]
    if dirname != '':
        os.makedirs(dirname, exist_ok=True)
    if 'twimg' in url:
        # Twitter image urls carry a size suffix which does not belong
        # in the file name.
        localname = localname.replace(':large', '')
        localname = localname.replace(':small', '')
    if os.path.exists(localname):
        print('\t%s already exists!!' % localname)
        return localname
    print('\tDownloading %s' % localname)
    # Pass a dict even when no headers were given, so this works with a
    # request_get that expects a mapping.
    downloading = request_get(url, stream=True, headers=headers or {})
    completed = False
    try:
        with open(localname, 'wb') as localfile:
            for chunk in downloading.iter_content(chunk_size=1024):
                if chunk:
                    localfile.write(chunk)
        completed = True
    finally:
        # A truncated file would be mistaken for a finished download by
        # the "already exists" check on the next run, so remove it.
        if not completed and os.path.exists(localname):
            os.remove(localname)
    return localname

def request_get(url, stream=False, headers=None):
    '''
    Perform a rate-limited GET request.

    url: The address to fetch.
    stream: Passed through to requests.get.
    headers: Optional dict of extra headers, merged on top of a copy of
        the module-wide HEADERS.

    Sleeps as needed so that at least SLEEPINESS seconds separate
    consecutive requests, then returns the requests response object.

    Raises StatusExc if the status code is not 200 or 206.
    '''
    global last_request
    elapsed = time.time() - last_request
    if elapsed < SLEEPINESS:
        time.sleep(SLEEPINESS - elapsed)
    last_request = time.time()

    # Work on a copy so per-call headers never leak into HEADERS.
    merged = HEADERS.copy()
    if headers:
        merged.update(headers)
    req = requests.get(url, stream=stream, headers=merged)
    if req.status_code not in [200,206]:
        raise StatusExc("Status code %d on url %s" % (req.status_code, url))
    return req

##############################################################################
                                                                            ##
def handle_gfycat(url, customname=None):
    '''
    Download a gfycat clip as .mp4 or .webm, depending on GFYCAT_MP4.

    The gfycat ID is the last path segment of `url` with any extension
    removed. Each subdomain in GFYCAT_SUBDOMAINS is tried in order and
    the path of the first successful download is returned. If every
    subdomain fails with StatusExc, None is returned.
    '''
    print('Gfycat')
    gfy_id = url.split('/')[-1].split('.')[0]
    extension = '.mp4' if GFYCAT_MP4 else '.webm'

    remote_name = gfy_id + extension
    if customname:
        local_name = customname + extension
    else:
        local_name = gfy_id + extension

    for subdomain in GFYCAT_SUBDOMAINS:
        candidate = 'http://%s.gfycat.com/%s' % (subdomain, remote_name)
        try:
            return download_file(candidate, local_name)
        except StatusExc:
            # Not hosted on this subdomain, try the next one.
            continue
    return None

def handle_liveleak(url, customname=None):
    '''
    Download the video of a Liveleak page as an .mp4 file.

    If the page contains a youtube embed, the iframe's src is handed to
    handle_master and its result is returned. Otherwise the file url
    found on the page is rewritten once for each entry of
    LIVELEAK_RESOLUTIONS; the first one that downloads wins, and the url
    exactly as found on the page is the last resort.

    Returns whatever the underlying download returned.

    Raises IndexError if the url has no "=" (and no customname is given)
    or if the expected markers are missing from the page.
    '''
    print('Liveleak')
    if customname:
        name = customname
    else:
        name = url.split('=')[1]
    name += '.mp4'
    pagedata = request_get(url).text

    if LIVELEAK_YOUTUBEIFRAME in pagedata:
        embed_lines = [line for line in pagedata.split('\n') if LIVELEAK_YOUTUBEIFRAME in line]
        embed_url = embed_lines[0].split('src="')[1].split('"')[0]
        print('\tFound youtube embed')
        # Return the result so callers get the downloaded path, the same
        # as they do from the direct-file branch below.
        return handle_master(embed_url, customname=customname)

    original = pagedata.split('file: "')[1].split('",')[0]
    # Swap whichever dotted segment carries the resolution tag for a
    # placeholder, so each preferred resolution can be substituted in.
    segments = [
        'LIVELEAKRESOLUTION' if 'h264_' in segment else segment
        for segment in original.split('.')
    ]
    template = '.'.join(segments)
    for res in LIVELEAK_RESOLUTIONS:
        candidate = template.replace('LIVELEAKRESOLUTION', res)
        try:
            return download_file(candidate, name)
        except StatusExc:
            # This resolution is not available, try the next one.
            pass
    return download_file(original, name)

def handle_imgur_html(url):
    '''
    Fetch an imgur page and return the list of image urls found on it.

    All spaces are stripped from the page, then every line containing
    IMGUR_ALBUM_INDV contributes the value of its content="..."
    attribute, with any query string removed.
    '''
    print('Imgur')
    html = request_get(url).text.replace(' ', '')
    links = []
    for line in html.split('\n'):
        if IMGUR_ALBUM_INDV not in line:
            continue
        content = line.split('content="')[1]
        content = content.split('"')[0]
        links.append(content.split('?')[0])
    print(links)
    return links

def handle_imgur(url, albumid='', customname=None):
    '''
    Download an imgur image, album or gallery.

    url: A direct image link (last path segment has an extension) or a
        page / album / gallery link.
    albumid: When downloading a member of an album, the album's name.
        Depending on IMGUR_ALBUMFOLDERS it becomes a subfolder or a
        file name prefix.
    customname: Replaces the imgur ID in the file name; the extension of
        the remote file is kept.

    Returns the local path for a direct link, a list of local paths for
    a page link (empty if no images were found on the page), or None if
    the url does not appear to contain an image ID.
    '''
    print('Imgur')
    name = url.split('/')[-1]
    if 'imgur.com' in name:
        # This link doesn't appear to have an image id
        return

    url = url.replace('/gallery/', '/a/')
    basename = name.split('.')[0]
    if '.' in name:
        # This is a direct image link
        if customname:
            # replace the imgur ID with the customname, keep ext.
            name = '%s.%s' % (customname, name.split('.')[-1])
        if albumid and albumid != basename:
            if IMGUR_ALBUMFOLDERS:
                # Build the paths with os.path.join so the album folder
                # works with the separator of any platform.
                os.makedirs(os.path.join(DOWNLOAD_DIRECTORY, albumid), exist_ok=True)
                localpath = os.path.join(albumid, name)
            else:
                localpath = '%s_%s' % (albumid, name)
        else:
            localpath = name

        return download_file(url, localpath)

    # Not a direct image link, let's read the html.
    images = handle_imgur_html(url)
    if customname:
        name = customname
    print('\tFound %d images' % len(images))

    if not images:
        # Nothing recognizable on the page; report that instead of
        # failing on images[0].
        return []

    if len(images) == 1:
        return [handle_imgur(images[0], customname=name)]

    localfiles = []
    for (index, image) in enumerate(images):
        image_id = image.split('/')[-1].split('.')[0]
        # Prefix with the position so the album order is preserved.
        member_name = '%d_%s' % (index, image_id)
        localfiles.append(handle_imgur(image, albumid=name, customname=member_name))
    return localfiles

def handle_twitter(url, customname=None):
    '''
    Save the text of a tweet as an .html file and download its media.

    The tweet paragraph is cut out of the page and written to
    <DOWNLOAD_DIRECTORY><name>.html, where name is `customname` or the
    status ID taken from the url. The first link found behind a
    data-url or data-expanded-url attribute is then passed to
    handle_master, unless it is the tweet's own url.

    Returns the path of the saved html file.

    Raises IndexError if the url has no "status/" part or the page has
    no tweet text paragraph.
    '''
    print('Twitter')
    pagedata = request_get(url).text

    idnumber = url.split('status/')[1].split('/')[0]
    if customname:
        name = customname
    else:
        name = idnumber
        customname = idnumber
    tweetpath = '%s.html' % (DOWNLOAD_DIRECTORY + name)

    psplit = '<p class="TweetTextSize'
    tweettext = pagedata.split(psplit)[1]
    tweettext = tweettext.split('</p>')[0]
    tweettext = psplit + tweettext + '</p>'
    tweettext = '<html><body>%s</body></html>' % tweettext
    # Hashtag links are relative on the page; make them absolute so they
    # still work from the saved file.
    tweettext = tweettext.replace('/hashtag/', 'http://twitter.com/hashtag/')
    with open(tweetpath, 'w', encoding='utf-8') as tweethtml:
        tweethtml.write(tweettext)
    print('\tSaved tweet text')

    for marker in ('data-url="', 'data-expanded-url="'):
        try:
            link = pagedata.split(marker)[1]
            link = link.split('"')[0]
            if link != url:
                handle_master(link, customname=customname)
            return tweetpath
        except IndexError:
            # Marker missing (or the media handler failed with an
            # IndexError of its own); fall through to the next marker.
            continue

    print('\tNo media detected')
    return tweetpath

def handle_vidble(url, customname=None):
    '''
    Download a vidble image or every image of a vidble album.

    For album urls (containing "/album/") all <img> tags whose src is a
    site-relative path outside of /assets/ are downloaded into a folder
    named `customname`, or the album ID if no customname is given. Files
    are prefixed with their position on the page and the "_med" size
    marker is removed from the url.

    For any other url the file is downloaded directly, named
    `customname` plus the remote extension, or the remote file name if
    no customname is given.

    Returns a list of local paths for an album, a single local path
    otherwise.
    '''
    print('Vidble')
    if '/album/' in url:
        # request_get already raises StatusExc for anything but 200/206,
        # so no further status check is needed here.
        pagedata = request_get(url).text
        # Name the parser explicitly so the result does not depend on
        # which optional parsers happen to be installed.
        soup = bs4.BeautifulSoup(pagedata, 'html.parser')
        sources = [img.attrs.get('src', None) for img in soup.find_all('img')]
        sources = [src for src in sources if src]
        sources = [src for src in sources if '/assets/' not in src]
        sources = [src for src in sources if src[0] == '/']

        if customname:
            folder = customname
        else:
            folder = url.split('/album/')[1].split('/')[0]

        localfiles = []
        for (index, source) in enumerate(sources):
            name = source.split('/')[-1]
            # os.path.join keeps the album folder working on platforms
            # where the backslash is not a path separator.
            localname = os.path.join(folder, '%d_%s' % (index, name))
            image = 'https://vidble.com' + source
            image = image.replace('_med', '')
            localfiles.append(download_file(image, localname))
        return localfiles

    remote_name = url.split('/')[-1]
    if customname:
        localname = customname + os.path.splitext(remote_name)[1]
    else:
        # Without a customname, keep the remote file name.
        localname = remote_name
    return download_file(url, localname)

def handle_vidme(url, customname=None):
    '''
    Download a vid.me video.

    The video address is read from the page line that mentions both
    ".mp4" and "og:video:url". The file is saved as `customname`, or as
    the last path segment of `url` plus ".mp4" when customname is None.

    Returns the local path of the download.
    '''
    print('Vidme')
    if customname is None:
        customname = url.split('/')[-1]+'.mp4'

    page_lines = request_get(url).text.split('\n')
    matches = [line for line in page_lines if '.mp4' in line and 'og:video:url' in line]
    video_url = matches[0].split('content="')[1].split('"')[0]
    # The address sits inside an HTML attribute, so ampersands are escaped.
    video_url = video_url.replace('&amp;', '&')

    # NOTE(review): the Host header is fixed to a single cloudfront
    # host -- confirm it matches the host of the extracted video url.
    headers = {
        'Referer': 'https://vid.me/',
        'Range':'bytes=0-',
        'Host':'d1wst0behutosd.cloudfront.net',
        'Cache-Control':'max-age=0',
    }
    return download_file(video_url, customname, headers=headers)

def handle_vimeo(url, customname=None):
    '''
    Download a vimeo video as an .mp4 file.

    The numeric video ID is the last path segment of `url` (query string
    removed). The player page for that ID is fetched, the JSON file
    dictionary between VIMEO_DICT_START and VIMEO_DICT_END is parsed,
    and the first quality listed in VIMEO_PRIORITY that is present gets
    downloaded.

    Returns the local path of the download.

    Raises ValueError if the ID is not numeric, IndexError if the file
    dictionary cannot be found on the player page, and KeyError if none
    of the VIMEO_PRIORITY qualities is offered.
    '''
    print('Vimeo')
    name = url.split('/')[-1]
    name = name.split('?')[0]
    try:
        int(name)
    except ValueError:
        print('Could not identify filename of %s' % url)
        raise
    url = 'http://player.vimeo.com/video/%s' % name
    pagedata = request_get(url).text
    pagedata = pagedata.replace('</script>', '<script')

    for chunk in pagedata.split('<script>'):
        if VIMEO_DICT_START in chunk:
            break
    else:
        # Fail with a clear message instead of stumbling over whichever
        # chunk happened to be last.
        raise IndexError('Could not find the vimeo file dictionary on %s' % url)
    chunk = chunk.split(VIMEO_DICT_START)[1]
    chunk = chunk.split(VIMEO_DICT_END)[0]
    files = json.loads(chunk)

    for priority in VIMEO_PRIORITY:
        if priority in files:
            fileurl = files[priority]['url']
            break
    else:
        # Without this, fileurl would be unbound further down.
        raise KeyError('None of the qualities %s are available on %s' % (VIMEO_PRIORITY, url))

    if customname:
        filename = customname + '.mp4'
    else:
        filename = name + '.mp4'
    return download_file(fileurl, filename)

def handle_youtube(url, customname=None):
    '''
    Download a youtube video by running the YOUTUBE_DL_FORMAT command.

    HTML-escaped ampersands and the "feature=player_embedded" parameter
    are removed from the url first. Without a customname the output
    name is left as the %(title)s placeholder and None is returned.
    With a customname, the expected path "<customname>.mp4" (prefixed
    with DOWNLOAD_DIRECTORY if set) is returned.
    '''
    print('Youtube')
    cleanups = (
        ('&amp;', '&'),
        ('feature=player_embedded&', ''),
        ('&feature=player_embedded', ''),
    )
    for (old, new) in cleanups:
        url = url.replace(old, new)

    output_name = customname if customname else '%(title)s'
    # NOTE(review): the url is interpolated into a shell command line;
    # urls scraped from other pages are passed through unescaped.
    command = YOUTUBE_DL_FORMAT.format(url=url, dir=DOWNLOAD_DIRECTORY, name=output_name)
    os.system(command)

    if not customname:
        return None
    if DOWNLOAD_DIRECTORY:
        return '%s/%s.mp4' % (DOWNLOAD_DIRECTORY, customname)
    return '%s.mp4' % customname

def handle_generic(url, customname=None):
    '''
    Best-effort download of an arbitrary url.

    The local name is `customname` or the last path segment of `url`.
    Its extension is taken from the name itself, else from the remote
    file name, else it defaults to "html".

    Returns the local path, or None if anything went wrong. Failures
    are reported on stdout rather than raised.
    '''
    print('Generic')
    try:
        remote_name = url.split('/')[-1]
        if customname:
            name = customname
        else:
            name = remote_name

        base = name.split('.')[0]
        if '.' in name:
            ext = name.split('.')[-1]
        elif '.' in remote_name:
            ext = remote_name.split('.')[-1]
        else:
            # No extension anywhere. Leave it blank so the html default
            # below applies, instead of leaving ext undefined.
            ext = ''

        if ext in [base, '']:
            ext = 'html'
        print(base)
        print(ext)

        name = '%s.%s' % (base, ext)

        return download_file(url, name)
    except Exception as exc:
        # Still best-effort, but say what failed, and let
        # KeyboardInterrupt / SystemExit through.
        print('\tGeneric download of %s failed: %r' % (url, exc))
        return None
                                                                            ##
##############################################################################

# Maps a domain substring to the function which downloads from that site.
# handle_master walks this dict in order and calls the first handler
# whose key appears anywhere in the (lowercased) url.
# Every handler is called as handler(url, customname=customname).
HANDLERS = {
    'gfycat.com': handle_gfycat,
    'imgur.com': handle_imgur,
    'liveleak.com': handle_liveleak,
    'vid.me': handle_vidme,
    'vidble.com': handle_vidble,
    'vimeo.com': handle_vimeo,
    'youtube.com': handle_youtube,
    'youtu.be': handle_youtube,
    'twitter.com': handle_twitter
    }

def handle_master(url, customname=None):
    '''
    Dispatch `url` to the first handler in HANDLERS whose key occurs in
    the url (case-insensitive) and return that handler's result.

    If no handler matches, fall back to handle_generic when DO_GENERIC
    is enabled; otherwise return None.
    '''
    print('Handling %s' % url)
    lowered = url.lower()
    for (domain, handler) in HANDLERS.items():
        if domain.lower() in lowered:
            return handler(url, customname=customname)
    if not DO_GENERIC:
        return None
    return handle_generic(url, customname=customname)

def test_imgur():
    '''
    Manual smoke test: run a set of imgur links through handle_master.
    '''
    cases = [
        # Imgur gallery album
        ('http://imgur.com/gallery/s4WLG', None),
        # Imgur standard album with customname
        ('http://imgur.com/a/s4WLG', 'album'),
        # Imgur indirect
        ('http://imgur.com/gvJUct0', None),
        # Imgur indirect single with customname
        ('http://imgur.com/gvJUct0', 'indirect'),
        # Imgur direct single
        ('http://i.imgur.com/gvJUct0.jpg', None),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

def test_gfycat():
    '''
    Manual smoke test: run a set of gfycat links through handle_master.
    '''
    cases = [
        # Gfycat direct .gif
        ('http://giant.gfycat.com/FatherlyBruisedIberianchiffchaff.gif', None),
        # Gfycat general link
        ('http://www.gfycat.com/RawWetFlatcoatretriever', None),
        # Gfycat general link with customname
        ('http://www.gfycat.com/RawWetFlatcoatretriever', 'gfycatgeneral'),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

def test_vimeo():
    '''
    Manual smoke test: run a set of vimeo links through handle_master.
    '''
    cases = [
        # Vimeo standard link
        ('https://vimeo.com/109405701', None),
        # Vimeo player link with customname
        ('https://player.vimeo.com/video/109405701', 'vimeoplayer'),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

def test_liveleak():
    '''
    Manual smoke test: run a set of Liveleak links through handle_master.
    '''
    cases = [
        # LiveLeak standard link
        ('http://www.liveleak.com/view?i=9d1_1429192014', None),
        # Liveleak article with youtube embed
        ('http://www.liveleak.com/view?i=ab8_1367941301', None),
        # LiveLeak standard link with customname
        ('http://www.liveleak.com/view?i=9d1_1429192014', 'liveleak'),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

def test_youtube():
    '''
    Manual smoke test: run a set of youtube links through handle_master.
    '''
    cases = [
        # Youtube standard link
        ('https://www.youtube.com/watch?v=bEgeh5hA5ko', None),
        # Youtube short link
        ('https://youtu.be/GjOBTstnW20', 'youtube'),
        # Youtube player embed link
        ('https://www.youtube.com/watch?feature=player_embedded&amp;v=bEgeh5hA5ko', None),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

def test_twitter():
    '''
    Manual smoke test: run a set of tweets through handle_master.
    '''
    cases = [
        # Twitter with twitter-image embed
        ('https://twitter.com/PetoLucem/status/599493836214272000', None),
        # Twitter with twitter-image embed
        ('https://twitter.com/Jalopnik/status/598287843128188929', None),
        # Twitter with twitter-image embed and customname
        ('https://twitter.com/Jalopnik/status/598287843128188929', 'twits'),
        # Twitter with youtube embed
        ('https://twitter.com/cp_orange_x3/status/599705117420457984', None),
        # Twitter plain text
        ('https://twitter.com/cp_orange_x3/status/599700702382817280', None),
        # Twitter plain text
        ('https://twitter.com/SyriacMFS/status/556513635913437184', None),
        # Twitter with arabic characters
        ('https://twitter.com/HadiAlabdallah/status/600885154991706113', None),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

def test_generic():
    '''
    Manual smoke test: run links without a dedicated handler through
    handle_master.
    '''
    cases = [
        # Some link that might work
        ('https://raw.githubusercontent.com/voussoir/reddit/master/SubredditBirthdays/show/statistics.txt', None),
        # Some link that might work with customname
        ('https://raw.githubusercontent.com/voussoir/reddit/master/SubredditBirthdays/show/statistics.txt', 'sss'),
        # Some link that might work
        ('https://github.com/voussoir/reddit/tree/master/SubredditBirthdays/show', None),
    ]
    for (url, customname) in cases:
        handle_master(url, customname=customname)

if __name__ == '__main__':
    # With a command line argument, download that url.
    # Without one, run the manual smoke tests enabled below.
    cli_urls = sys.argv[1:]
    if cli_urls:
        handle_master(cli_urls[0])
    else:
        # Currently disabled: test_imgur, test_gfycat, test_vimeo,
        # test_twitter, test_generic.
        test_liveleak()
        test_youtube()
else 2016-03-07 20:25:50 +00:00			`import bs4`
else totaldl 1 2015-05-15 05:40:19 +00:00			`import json`
			`import requests`
			`import os`
			`import time`
else totaldl tweet text 2015-05-20 03:17:00 +00:00			`import sys`
else totaldl 1 2015-05-15 05:40:19 +00:00
			`HEADERS = {'User-Agent': 'Mozilla/5.0 (Windows NT 6.1; WOW64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/42.0.2311.152 Safari/537.36'}`

else totaldl 8 2015-05-16 02:27:24 +00:00			`DOWNLOAD_DIRECTORY = ''`
else totaldl 6 2015-05-16 00:24:00 +00:00			`# Save files to this folder`
			`# If blank, it uses the local folder`

else 2015-10-03 23:29:52 +00:00			`IMGUR_ALBUM_INDV = '<metaproperty="og:image"'`
else 2015-06-03 03:30:35 +00:00			`IMGUR_ALBUM_INDV2 = 'linkrel="image_src"'`
else totaldl 1 2015-05-15 05:40:19 +00:00			`# The HTML string which tells us that an image link is`
			`# on this line.`

			`IMGUR_ALBUMFOLDERS = True`
			`# If True, the individual images belonging to an album will be placed`
			`# into a folder named after the album, like <album_id>/<img_id>.jpg`
			`# Else, files will be named <album_id>_<img_id>.jpg and placed`
			`# in the local folder.`

else 2016-03-07 20:25:50 +00:00			`GFYCAT_MP4 = False`
else totaldl 1 2015-05-15 05:40:19 +00:00			`# If True, download gfycat urls in .mp4`
			`# Else, .webm`

			`GFYCAT_SUBDOMAINS = ['zippy', 'fat', 'giant']`

			`SLEEPINESS = 2`
			`# The number of seconds to wait in between making requests`
			`# Similar to PRAW's ratelimit handling.`
			`# Not required, but probably better for the environment.`

			`VIMEO_DICT_START = '"files":{"h264":'`
			`VIMEO_DICT_END = ',"hls"'`
			`# The HTML string which tells us where the mp4 file is`

			`VIMEO_PRIORITY = ['hd', 'sd', 'mobile']`
			`# Download files in this priority`

else totaldl 5 2015-05-16 00:01:23 +00:00			`LIVELEAK_YOUTUBEIFRAME = 'youtube.com/embed'`

else totaldl 7 2015-05-16 02:00:24 +00:00			`LIVELEAK_RESOLUTIONS = ['h264_base', 'h264_720p', 'h264_270p']`

else 2015-06-03 03:30:35 +00:00			`YOUTUBE_DL_FORMAT = 'youtube-dl "{url}" --no-playlist --force-ipv4 -o "/{dir}/{name}.%(ext)s"'`
			`# The format for the youtube-dl shell command`

else totaldl 1 2015-05-15 05:40:19 +00:00			`DO_GENERIC = True`
			`# If true, attempt to download whatever URL goes in`
			`# Else, only download from the explicitly supported sites`

			`''' End user config '''`

			`last_request = 0`

else totaldl 8 2015-05-16 02:27:24 +00:00			`if DOWNLOAD_DIRECTORY != '':`
else 2016-03-07 20:25:50 +00:00			`if DOWNLOAD_DIRECTORY[-1] not in ['/', '\\']:`
			`DOWNLOAD_DIRECTORY += '\\'`
else 2016-05-10 08:00:29 +00:00
			`os.makedirs(DOWNLOAD_DIRECTORY, exist_ok=True)`
else totaldl 6 2015-05-16 00:24:00 +00:00
else totaldl 1 2015-05-15 05:40:19 +00:00			`class StatusExc(Exception):`
else 2016-03-07 20:25:50 +00:00			`pass`
else totaldl 1 2015-05-15 05:40:19 +00:00
else It's been a while since I updated this. 2015-06-26 04:03:45 +00:00			`def download_file(url, localname, headers={}):`
else 2016-03-07 20:25:50 +00:00			`localname = os.path.join(DOWNLOAD_DIRECTORY, localname)`
			`dirname = os.path.split(localname)[0]`
else 2016-05-10 08:00:29 +00:00			`if dirname != '':`
			`os.makedirs(dirname, exist_ok=True)`
else 2016-03-07 20:25:50 +00:00			`if 'twimg' in url:`
			`localname = localname.replace(':large', '')`
			`localname = localname.replace(':small', '')`
			`if os.path.exists(localname):`
			`print('\t%s already exists!!' % localname)`
			`return localname`
			`print('\tDownloading %s' % localname)`
			`downloading = request_get(url, stream=True, headers=headers)`
			`localfile = open(localname, 'wb')`
			`for chunk in downloading.iter_content(chunk_size=1024):`
			`if chunk:`
			`localfile.write(chunk)`
			`localfile.close()`
			`return localname`
else totaldl 1 2015-05-15 05:40:19 +00:00
else It's been a while since I updated this. 2015-06-26 04:03:45 +00:00			`def request_get(url, stream=False, headers={}):`
else 2016-03-07 20:25:50 +00:00			`global last_request`
			`now = time.time()`
			`diff = now - last_request`
			`if diff < SLEEPINESS:`
			`diff = SLEEPINESS - diff`
			`time.sleep(diff)`
			`last_request = time.time()`
			`h = HEADERS.copy()`
			`h.update(headers)`
			`req = requests.get(url, stream=stream, headers=h)`
			`if req.status_code not in [200,206]:`
			`raise StatusExc("Status code %d on url %s" % (req.status_code, url))`
			`return req`
else totaldl 1 2015-05-15 05:40:19 +00:00
			`##############################################################################`
			`##`
else 2016-03-07 20:25:50 +00:00			`def handle_gfycat(url, customname=None):`
			`print('Gfycat')`
			`name = url.split('/')[-1]`
			`name = name.split('.')[0]`
			`if customname:`
			`filename = customname`
			`else:`
			`filename = name`

			`if GFYCAT_MP4:`
			`name += '.mp4'`
			`filename += '.mp4'`
			`else:`
			`name += '.webm'`
			`filename += '.webm'`

			`for subdomain in GFYCAT_SUBDOMAINS:`
			`url = 'http://%s.gfycat.com/%s' % (subdomain, name)`
			`try:`
			`return download_file(url, filename)`
			`except StatusExc:`
			`pass`
else totaldl 1 2015-05-15 05:40:19 +00:00
else 2016-03-07 20:25:50 +00:00			`def handle_liveleak(url, customname=None):`
			`print('Liveleak')`
			`if customname:`
			`name = customname`
			`else:`
			`name = url.split('=')[1]`
			`name += '.mp4'`
			`pagedata = request_get(url)`
			`pagedata = pagedata.text`
			`if LIVELEAK_YOUTUBEIFRAME in pagedata:`
			`pagedata = pagedata.split('\n')`
			`pagedata = [line for line in pagedata if LIVELEAK_YOUTUBEIFRAME in line]`
			`pagedata = pagedata[0]`
			`pagedata = pagedata.split('src="')[1]`
			`pagedata = pagedata.split('"')[0]`
			`print('\tFound youtube embed')`
			`handle_master(pagedata, customname=customname)`
			`else:`
			`pagedata = pagedata.split('file: "')[1]`
			`pagedata = pagedata.split('",')[0]`
			`original = pagedata`
			`pagedata = pagedata.split('.')`
			`for spoti in range(len(pagedata)):`
			`if 'h264_' in pagedata[spoti]:`
			`pagedata[spoti] = 'LIVELEAKRESOLUTION'`
			`pagedata = '.'.join(pagedata)`
			`for res in LIVELEAK_RESOLUTIONS:`
			`url = pagedata.replace('LIVELEAKRESOLUTION', res)`
			`try:`
			`return download_file(url, name)`
			`except StatusExc:`
			`pass`
			`return download_file(original, name)`
else totaldl 1 2015-05-15 05:40:19 +00:00
else 2016-03-07 20:25:50 +00:00			`def handle_imgur_html(url):`
			`print('Imgur')`
			`pagedata = request_get(url)`
			`pagedata = pagedata.text.replace(' ', '')`
			`pagedata = pagedata.split('\n')`
			`pagedata = [line for line in pagedata if IMGUR_ALBUM_INDV in line]`
			`pagedata = [line.split('content="')[1] for line in pagedata]`
			`links = [line.split('"')[0] for line in pagedata]`
			`links = [line.split('?')[0] for line in links]`
			`print(links)`
			`return links`
else totaldl 1 2015-05-15 05:40:19 +00:00
else 2016-03-07 20:25:50 +00:00			`def handle_imgur(url, albumid='', customname=None):`
			`print('Imgur')`
			`name = url.split('/')[-1]`
			`if 'imgur.com' in name:`
			`# This link doesn't appear to have an image id`
			`return`

			`url = url.replace('/gallery/', '/a/')`
			`basename = name.split('.')[0]`
			`if '.' in name:`
			`# This is a direct image link`
			`if customname:`
			`# replace the imgur ID with the customname, keep ext.`
			`name = '%s.%s' % (customname, name.split('.')[-1])`
			`if albumid and albumid != basename:`

			`if IMGUR_ALBUMFOLDERS:`

else 2016-05-10 08:00:29 +00:00			`os.makedirs(DOWNLOAD_DIRECTORY + albumid, exist_ok=True)`
else 2016-03-07 20:25:50 +00:00			`localpath = '%s\\%s' % (albumid, name)`

			`else:`
			`localpath = '%s_%s' % (albumid, name)`

			`else:`
			`localpath = name`

			`return download_file(url, localpath)`

			`else:`
			`# Not a direct image link, let's read the html.`
			`images = handle_imgur_html(url)`
			`if customname:`
			`name = customname`
			`print('\tFound %d images' % len(images))`

			`localfiles = []`
			`if len(images) > 1:`
			`for imagei in range(len(images)):`
			`image = images[imagei]`
			`iname = image.split('/')[-1]`
			`iname = iname.split('.')[0]`
			`x = handle_imgur(image, albumid=name, customname='%d_%s' % (imagei, iname))`
			`localfiles.append(x)`
			`else:`
			`x = handle_imgur(images[0], customname=name)`
			`localfiles.append(x)`
			`return localfiles`
else totaldl 1 2015-05-15 05:40:19 +00:00
else 2016-03-07 20:25:50 +00:00			`def handle_twitter(url, customname=None):`
			`print('Twitter')`
			`pagedata = request_get(url)`
			`pagedata = pagedata.text`

			`idnumber = url.split('status/')[1].split('/')[0]`
			`if customname:`
			`name = customname`
			`else:`
			`name = idnumber`
			`customname = idnumber`
			`tweetpath = '%s.html' % (DOWNLOAD_DIRECTORY + name)`
			`psplit = '<p class="TweetTextSize'`
			`tweettext = pagedata.split(psplit)[1]`
			`tweettext = tweettext.split('</p>')[0]`
			`tweettext = psplit + tweettext + '</p>'`
			`tweettext = '<html><body>%s</body></html>' % tweettext`
			`tweettext = tweettext.replace('/hashtag/', 'http://twitter.com/hashtag/')`
			`tweethtml = open(tweetpath, 'w', encoding='utf-8')`
			`tweethtml.write(tweettext)`
			`tweethtml.close()`
			`print('\tSaved tweet text')`
			`try:`
			`link = pagedata.split('data-url="')[1]`
			`link = link.split('"')[0]`
			`if link != url:`
			`handle_master(link, customname=customname)`
			`return tweetpath`
			`except IndexError:`
			`try:`
			`link = pagedata.split('data-expanded-url="')[1]`
			`link = link.split('"')[0]`
			`if link != url:`
			`handle_master(link, customname=customname)`
			`return tweetpath`
			`except IndexError:`
			`pass`
			`return tweetpath`
			`print('\tNo media detected')`

			`def handle_vidble(url, customname=None):`
			`print('Vidble')`
			`if '/album/' in url:`
			`pagedata = request_get(url)`
			`pagedata.raise_for_status()`
			`pagedata = pagedata.text`
			`soup = bs4.BeautifulSoup(pagedata)`
			`images = soup.find_all('img')`
			`images = [i for i in images if i.attrs.get('src', None)]`
			`images = [i.attrs['src'] for i in images]`
			`images = [i for i in images if '/assets/' not in i]`
			`images = [i for i in images if i[0] == '/']`
			`if customname:`
			`folder = customname`
			`else:`
			`folder = url.split('/album/')[1].split('/')[0]`
			`for (index, image) in enumerate(images):`
			`name = image.split('/')[-1]`
			`localname = '{folder}\\{index}_{name}'.format(folder=folder, index=index, name=name)`
			`image = 'https://vidble.com' + image`
else 2016-07-05 07:24:08 +00:00			`image = image.replace('_med', '')`
else 2016-03-07 20:25:50 +00:00			`download_file(image, localname)`
			`else:`
			`localname = url.split('/')[-1]`
			`extension = os.path.splitext(localname)[1]`
			`localname = customname + extension`
			`download_file(url, localname)`
else totaldl 1 2015-05-15 05:40:19 +00:00
else It's been a while since I updated this. 2015-06-26 04:03:45 +00:00			`def handle_vidme(url, customname=None):`
else 2016-03-07 20:25:50 +00:00			`print('Vidme')`
			`if customname is None:`
			`customname = url.split('/')[-1]+'.mp4'`
			`pagedata = request_get(url)`
			`pagedata = pagedata.text`
			`pagedata = pagedata.split('\n')`
			`pagedata = [l for l in pagedata if '.mp4' in l and 'og:video:url' in l]`
			`pagedata = pagedata[0]`
			`pagedata = pagedata.split('content="')[1].split('"')[0]`
			`pagedata = pagedata.replace('&', '&')`
			`headers = {'Referer': 'https://vid.me/',`
			`'Range':'bytes=0-',`
			`'Host':'d1wst0behutosd.cloudfront.net',`
			`'Cache-Control':'max-age=0'}`

			`return download_file(pagedata, customname, headers=headers)`
else It's been a while since I updated this. 2015-06-26 04:03:45 +00:00
else totaldl 3 2015-05-15 21:46:32 +00:00			`def handle_vimeo(url, customname=None):`
else 2016-03-07 20:25:50 +00:00			`print('Vimeo')`
			`name = url.split('/')[-1]`
			`name = name.split('?')[0]`
			`try:`
			`int(name)`
			`except ValueError as e:`
			`print('Could not identify filename of %s' % url)`
			`raise e`
			`url = 'http://player.vimeo.com/video/%s' % name`
			`pagedata = request_get(url)`
			`pagedata = pagedata.text`
			`pagedata = pagedata.replace('</script>', '<script')`
			`pagedata = pagedata.split('<script>')`
			`for chunk in pagedata:`
			`if VIMEO_DICT_START in chunk:`
			`break`
			`chunk = chunk.split(VIMEO_DICT_START)[1]`
			`chunk = chunk.split(VIMEO_DICT_END)[0]`
			`chunk = json.loads(chunk)`

			`for priority in VIMEO_PRIORITY:`
			`if priority in chunk:`
			`fileurl = chunk[priority]['url']`
			`break`
			`if customname:`
			`filename = customname + '.mp4'`
			`else:`
			`filename = name + '.mp4'`
			`return download_file(fileurl, filename)`
else totaldl 1 2015-05-15 05:40:19 +00:00
else totaldl 3 2015-05-15 21:46:32 +00:00			`def handle_youtube(url, customname=None):`
else 2016-03-07 20:25:50 +00:00			`print('Youtube')`
			`url = url.replace('&', '&')`
			`url = url.replace('feature=player_embedded&', '')`
			`url = url.replace('&feature=player_embedded', '')`
			`if not customname:`
			`os.system(YOUTUBE_DL_FORMAT.format(url=url, dir=DOWNLOAD_DIRECTORY, name='%(title)s'))`
			`return`
			`os.system(YOUTUBE_DL_FORMAT.format(url=url, dir=DOWNLOAD_DIRECTORY, name=customname))`
			`if DOWNLOAD_DIRECTORY:`
			`return '%s/%s.mp4' % (DOWNLOAD_DIRECTORY, customname)`
			`return '%s.mp4' % customname`
else totaldl twitter 2015-05-16 22:44:25 +00:00
else totaldl 3 2015-05-15 21:46:32 +00:00			`def handle_generic(url, customname=None):`
else 2016-03-07 20:25:50 +00:00			`print('Generic')`
			`try:`
else 2016-05-10 08:00:29 +00:00			`remote_name = url.split('/')[-1]`
else 2016-03-07 20:25:50 +00:00			`if customname:`
			`name = customname`
			`else:`
else 2016-05-10 08:00:29 +00:00			`name = remote_name`
else 2016-03-07 20:25:50 +00:00
			`base = name.split('.')[0]`
else 2016-05-10 08:00:29 +00:00			`if '.' in name:`
			`ext = name.split('.')[-1]`
			`elif '.' in remote_name:`
			`ext = remote_name.split('.')[-1]`

else 2016-03-07 20:25:50 +00:00			`if ext in [base, '']:`
			`ext = 'html'`
			`print(base)`
			`print(ext)`

			`name = '%s.%s' % (base, ext)`

			`return download_file(url, name)`
			`except:`
			`pass`
else totaldl 1 2015-05-15 05:40:19 +00:00			`##`
			`##############################################################################`

			`HANDLERS = {`
else 2016-03-07 20:25:50 +00:00			`'gfycat.com': handle_gfycat,`
			`'imgur.com': handle_imgur,`
			`'liveleak.com': handle_liveleak,`
			`'vid.me': handle_vidme,`
			`'vidble.com': handle_vidble,`
			`'vimeo.com': handle_vimeo,`
			`'youtube.com': handle_youtube,`
			`'youtu.be': handle_youtube,`
			`'twitter.com': handle_twitter`
			`}`
else totaldl 1 2015-05-15 05:40:19 +00:00
else totaldl 3 2015-05-15 21:46:32 +00:00			`def handle_master(url, customname=None):`
else 2016-03-07 20:25:50 +00:00			`print('Handling %s' % url)`
			`for handlerkey in HANDLERS:`
			`if handlerkey.lower() in url.lower():`
			`return HANDLERS[handlerkey](url, customname=customname)`
			`if DO_GENERIC:`
			`return handle_generic(url, customname=customname)`
else totaldl 1 2015-05-15 05:40:19 +00:00
def test_imgur():
    """Pass a sample of each imgur link shape through handle_master."""
    samples = (
        # Imgur gallery album
        ('http://imgur.com/gallery/s4WLG', None),
        # Imgur standard album with customname
        ('http://imgur.com/a/s4WLG', 'album'),
        # Imgur indirect
        ('http://imgur.com/gvJUct0', None),
        # Imgur indirect single with customname
        ('http://imgur.com/gvJUct0', 'indirect'),
        # Imgur direct single
        ('http://i.imgur.com/gvJUct0.jpg', None),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else totaldl 1 2015-05-15 05:40:19 +00:00
def test_gfycat():
    """Pass a sample of each gfycat link shape through handle_master."""
    samples = (
        # Gfycat direct .gif
        ('http://giant.gfycat.com/FatherlyBruisedIberianchiffchaff.gif', None),
        # Gfycat general link
        ('http://www.gfycat.com/RawWetFlatcoatretriever', None),
        # Gfycat general link with customname
        ('http://www.gfycat.com/RawWetFlatcoatretriever', 'gfycatgeneral'),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else totaldl 3 2015-05-15 21:46:32 +00:00
def test_vimeo():
    """Pass a sample of each vimeo link shape through handle_master."""
    samples = (
        # Vimeo standard link
        ('https://vimeo.com/109405701', None),
        # Vimeo player link with customname
        ('https://player.vimeo.com/video/109405701', 'vimeoplayer'),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else totaldl 3 2015-05-15 21:46:32 +00:00
def test_liveleak():
    """Pass a sample of each liveleak link shape through handle_master."""
    samples = (
        # LiveLeak standard link
        ('http://www.liveleak.com/view?i=9d1_1429192014', None),
        # LiveLeak article with youtube embed
        ('http://www.liveleak.com/view?i=ab8_1367941301', None),
        # LiveLeak standard link with customname
        ('http://www.liveleak.com/view?i=9d1_1429192014', 'liveleak'),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else totaldl 3 2015-05-15 21:46:32 +00:00
def test_youtube():
    """Pass a sample of each youtube link shape through handle_master."""
    samples = (
        # Youtube standard link
        ('https://www.youtube.com/watch?v=bEgeh5hA5ko', None),
        # Youtube short link, saved under a customname
        ('https://youtu.be/GjOBTstnW20', 'youtube'),
        # Youtube player embed link
        ('https://www.youtube.com/watch?feature=player_embedded&v=bEgeh5hA5ko', None),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else totaldl 3 2015-05-15 21:46:32 +00:00
def test_twitter():
    """Pass a sample of each kind of tweet through handle_master."""
    samples = (
        # Twitter with twitter-image embed
        ('https://twitter.com/PetoLucem/status/599493836214272000', None),
        # Twitter with twitter-image embed
        ('https://twitter.com/Jalopnik/status/598287843128188929', None),
        # Twitter with twitter-image embed and customname
        ('https://twitter.com/Jalopnik/status/598287843128188929', 'twits'),
        # Twitter with youtube embed
        ('https://twitter.com/cp_orange_x3/status/599705117420457984', None),
        # Twitter plain text
        ('https://twitter.com/cp_orange_x3/status/599700702382817280', None),
        # Twitter plain text
        ('https://twitter.com/SyriacMFS/status/556513635913437184', None),
        # Twitter with arabic characters
        ('https://twitter.com/HadiAlabdallah/status/600885154991706113', None),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else 2015-06-03 03:30:35 +00:00
def test_generic():
    """Pass links with no dedicated site handler through handle_master."""
    samples = (
        # Some link that might work
        ('https://raw.githubusercontent.com/voussoir/reddit/master/SubredditBirthdays/show/statistics.txt', None),
        # Some link that might work with customname
        ('https://raw.githubusercontent.com/voussoir/reddit/master/SubredditBirthdays/show/statistics.txt', 'sss'),
        # Some link that might work
        ('https://github.com/voussoir/reddit/tree/master/SubredditBirthdays/show', None),
    )
    for link, name in samples:
        handle_master(link, customname=name)
else totaldl 1 2015-05-15 05:40:19 +00:00
if __name__ == '__main__':
    # Script entry point: download the URL given as the first command-line
    # argument, or run the enabled sample downloads when none is given.
    cli_args = sys.argv[1:]
    if not cli_args:
        # Uncomment a line to include that site's samples in the run.
        #test_imgur()
        #test_gfycat()
        #test_vimeo()
        test_liveleak()
        test_youtube()
        #test_twitter()
        #test_generic()
    else:
        handle_master(cli_args[0])